From da597b800af01ba04c9d035c031c66092ba2127c Mon Sep 17 00:00:00 2001
From: Yuan
Date: Thu, 30 Dec 2021 20:24:41 +0800
Subject: [PATCH] [NSE-667] backport patches to 1.3 branch (#666)

* [NSE-636]Remove log4j1 related unit tests (#646)

* [NSE-640] Disable compression for tiny payloads in shuffle (#641)

Closes #640

* [NSE-653] Add validity checking for get_json_object in WSCG (#654)

* Initial commit
* Add two unit test cases
* Format the code
* Update clang format check

* [NSE-617] Handle exception in cast expression from string to numeric types in WSCG (#655)

* [NSE-660] fix window builder with string (#649)

* fix window builder with string

Signed-off-by: Yuan Zhou

* fix format

Signed-off-by: Yuan Zhou

* [NSE-650] Scala test ArrowColumnarBatchSerializerSuite is failing (#659)

Closes #650

* [NSE-645] Add support to cast bool type to bigint type & string type (#644)

* Initial commit
* Change arrow branch for test [revert this commit at last]
* Revert "Change arrow branch for test [revert this commit at last]"

This reverts commit 94ce7fbfc4025d48c252f91701459b4ed091dad9.

* use arrow 1.3 branch

Signed-off-by: Yuan Zhou

* [NSE-662] Add "like" expression support in WSCG (#663)

* Initial commit
* Copy headers
* Format the code
* Change arrow branch for test [will revert at last]
* Revert "Change arrow branch for test [will revert at last]"

This reverts commit 065547a3f689ac23b9d140857032ba42e0bffff3.

* [NSE-126] remove extra headers/namespaces in codegen (#668)

* remove extra gandiva header

Signed-off-by: Yuan Zhou

* remove extra using namespace

Signed-off-by: Yuan Zhou

* [NSE-661] Add trim expression support in WSCG (#664)

* Add trim expression support in WSCG
* Fix a bug
* Format the code

Co-authored-by: Wei-Ting Chen
Co-authored-by: Hongze Zhang
Co-authored-by: PHILO-HE
---
 .github/workflows/tpch.yml | 2 +-
 .github/workflows/unittests.yml | 8 +-
 arrow-data-source/README.md | 2 +-
 arrow-data-source/script/build_arrow.sh | 2 +-
 docs/ApacheArrowInstallation.md | 2 +-
 docs/Installation.md | 2 +-
 .../vectorized/CompressedVectorLoader.java | 7 ++
 ...chemaAwareArrowCompressedStreamReader.java | 33 +++--
 .../vectorized/ShuffleSplitterJniWrapper.java | 3 +
 .../com/intel/oap/GazellePluginConfig.scala | 5 +-
 .../expression/ColumnarUnaryOperator.scala | 24 ++--
 .../ArrowColumnarBatchSerializer.scala | 6 +-
 .../spark/shuffle/ColumnarShuffleWriter.scala | 4 +
 .../intel/oap/misc/PartitioningSuite.scala | 4 +-
 .../com/intel/oap/tpc/ds/Orc_TPCDSSuite.scala | 4 +-
 .../com/intel/oap/tpc/ds/TPCDSSuite.scala | 4 +-
 .../com/intel/oap/tpc/h/Orc_TPCHSuite.scala | 4 +-
 .../scala/com/intel/oap/tpc/h/TPCHSuite.scala | 4 +-
 .../ArrowColumnarBatchSerializerSuite.scala | 114 +++++++++---------
 .../org/apache/spark/sql/CTEHintSuite.scala | 6 +-
 .../spark/sql/CharVarcharTestSuite.scala | 2 +
 .../org/apache/spark/sql/JoinHintSuite.scala | 8 +-
 .../spark/sql/SparkSessionBuilderSuite.scala | 4 +
 .../adaptive/AdaptiveQueryExecSuite.scala | 6 +-
 .../ColumnarAdaptiveQueryExecSuite.scala | 2 +-
 .../execution/datasources/csv/CSVSuite.scala | 2 +
 .../v2/jdbc/JDBCTableCatalogSuite.scala | 4 +-
 .../spark/sql/internal/SQLConfSuite.scala | 4 +-
 ...NativeColumnarAdaptiveQueryExecSuite.scala | 2 +-
 native-sql-engine/cpp/src/CMakeLists.txt | 4 +-
 .../ext/expression_codegen_visitor.cc | 86 +++++++++----
 .../codegen/arrow_compute/ext/kernels_ext.h | 5 +
 .../ext/whole_stage_codegen_kernel.cc | 2 +-
 .../arrow_compute/ext/window_kernel.cc | 8 ++
 native-sql-engine/cpp/src/jni/jni_wrapper.cc | 7 +-
 .../cpp/src/precompile/gandiva.h | 64 +++++++++-
native-sql-engine/cpp/src/shuffle/splitter.cc | 69 +++++++---- native-sql-engine/cpp/src/shuffle/splitter.h | 3 + native-sql-engine/cpp/src/shuffle/type.h | 2 + .../tests/arrow_compute_test_precompile.cc | 26 +++- 40 files changed, 390 insertions(+), 160 deletions(-) diff --git a/.github/workflows/tpch.yml b/.github/workflows/tpch.yml index 55995e960..57f2eb247 100644 --- a/.github/workflows/tpch.yml +++ b/.github/workflows/tpch.yml @@ -51,7 +51,7 @@ jobs: run: | cd /tmp git clone https://github.com/oap-project/arrow.git - cd arrow && git checkout arrow-4.0.0-oap && cd cpp + cd arrow && git checkout arrow-4.0.0-oap-1.3 && cd cpp mkdir build && cd build cmake .. -DARROW_JNI=ON -DARROW_GANDIVA_JAVA=ON -DARROW_GANDIVA=ON -DARROW_PARQUET=ON -DARROW_ORC=ON -DARROW_CSV=ON -DARROW_HDFS=ON -DARROW_FILESYSTEM=ON -DARROW_WITH_SNAPPY=ON -DARROW_JSON=ON -DARROW_DATASET=ON -DARROW_WITH_LZ4=ON -DARROW_JEMALLOC=OFF && make -j2 sudo make install diff --git a/.github/workflows/unittests.yml b/.github/workflows/unittests.yml index 2edf1b79f..62699d5ea 100644 --- a/.github/workflows/unittests.yml +++ b/.github/workflows/unittests.yml @@ -45,7 +45,7 @@ jobs: run: | cd /tmp git clone https://github.com/oap-project/arrow.git - cd arrow && git checkout arrow-4.0.0-oap && cd cpp + cd arrow && git checkout arrow-4.0.0-oap-1.3 && cd cpp mkdir build && cd build cmake .. -DARROW_JNI=ON -DARROW_GANDIVA_JAVA=ON -DARROW_GANDIVA=ON -DARROW_PARQUET=ON -DARROW_ORC=ON -DARROW_CSV=ON -DARROW_HDFS=ON -DARROW_FILESYSTEM=ON -DARROW_WITH_SNAPPY=ON -DARROW_JSON=ON -DARROW_DATASET=ON -DARROW_WITH_LZ4=ON -DGTEST_ROOT=/usr/src/gtest && make -j2 sudo make install @@ -88,7 +88,7 @@ jobs: run: | cd /tmp git clone https://github.com/oap-project/arrow.git - cd arrow && git checkout arrow-4.0.0-oap && cd cpp + cd arrow && git checkout arrow-4.0.0-oap-1.3 && cd cpp mkdir build && cd build cmake .. -DARROW_JNI=ON -DARROW_GANDIVA_JAVA=ON -DARROW_GANDIVA=ON -DARROW_PARQUET=ON -DARROW_ORC=ON -DARROW_CSV=ON -DARROW_HDFS=ON -DARROW_FILESYSTEM=ON -DARROW_WITH_SNAPPY=ON -DARROW_JSON=ON -DARROW_DATASET=ON -DARROW_WITH_LZ4=ON -DGTEST_ROOT=/usr/src/gtest && make -j2 sudo make install @@ -135,7 +135,7 @@ jobs: run: | cd /tmp git clone https://github.com/oap-project/arrow.git - cd arrow && git checkout arrow-4.0.0-oap && cd cpp + cd arrow && git checkout arrow-4.0.0-oap-1.3 && cd cpp mkdir build && cd build cmake .. -DARROW_JNI=ON -DARROW_GANDIVA_JAVA=ON -DARROW_GANDIVA=ON -DARROW_PARQUET=ON -DARROW_ORC=ON -DARROW_CSV=ON -DARROW_HDFS=ON -DARROW_FILESYSTEM=ON -DARROW_WITH_SNAPPY=ON -DARROW_JSON=ON -DARROW_DATASET=ON -DARROW_WITH_LZ4=ON -DGTEST_ROOT=/usr/src/gtest && make -j2 sudo make install @@ -159,7 +159,7 @@ jobs: steps: - uses: actions/checkout@v2 - name: Run clang-format style check for C/C++ programs. - uses: jidicula/clang-format-action@v3.2.0 + uses: jidicula/clang-format-action@v3.5.1 with: clang-format-version: '10' check-path: 'native-sql-engine/cpp/src' diff --git a/arrow-data-source/README.md b/arrow-data-source/README.md index 20e07cf9e..e71f96fdc 100644 --- a/arrow-data-source/README.md +++ b/arrow-data-source/README.md @@ -117,7 +117,7 @@ You have to use a customized Arrow to support for our datasets Java API. 
``` // build arrow-cpp -git clone -b arrow-4.0.0-oap https://github.com/oap-project/arrow.git +git clone -b arrow-4.0.0-oap-1.3 https://github.com/oap-project/arrow.git cd arrow/cpp mkdir build cd build diff --git a/arrow-data-source/script/build_arrow.sh b/arrow-data-source/script/build_arrow.sh index d8ec40128..facc4d581 100755 --- a/arrow-data-source/script/build_arrow.sh +++ b/arrow-data-source/script/build_arrow.sh @@ -62,7 +62,7 @@ echo "ARROW_SOURCE_DIR=${ARROW_SOURCE_DIR}" echo "ARROW_INSTALL_DIR=${ARROW_INSTALL_DIR}" mkdir -p $ARROW_SOURCE_DIR mkdir -p $ARROW_INSTALL_DIR -git clone https://github.com/oap-project/arrow.git --branch arrow-4.0.0-oap $ARROW_SOURCE_DIR +git clone https://github.com/oap-project/arrow.git --branch arrow-4.0.0-oap-1.3 $ARROW_SOURCE_DIR pushd $ARROW_SOURCE_DIR cmake ./cpp \ diff --git a/docs/ApacheArrowInstallation.md b/docs/ApacheArrowInstallation.md index c40734dda..24dc2e9f8 100644 --- a/docs/ApacheArrowInstallation.md +++ b/docs/ApacheArrowInstallation.md @@ -30,7 +30,7 @@ Please make sure your cmake version is qualified based on the prerequisite. # Arrow ``` shell git clone https://github.com/oap-project/arrow.git -cd arrow && git checkout arrow-4.0.0-oap +cd arrow && git checkout arrow-4.0.0-oap-1.3 mkdir -p arrow/cpp/release-build cd arrow/cpp/release-build cmake -DARROW_DEPENDENCY_SOURCE=BUNDLED -DARROW_GANDIVA_JAVA=ON -DARROW_GANDIVA=ON -DARROW_PARQUET=ON -DARROW_ORC=ON -DARROW_CSV=ON -DARROW_HDFS=ON -DARROW_BOOST_USE_SHARED=ON -DARROW_JNI=ON -DARROW_DATASET=ON -DARROW_WITH_PROTOBUF=ON -DARROW_WITH_SNAPPY=ON -DARROW_WITH_LZ4=ON -DARROW_FILESYSTEM=ON -DARROW_JSON=ON .. diff --git a/docs/Installation.md b/docs/Installation.md index 87a1a3940..943673680 100644 --- a/docs/Installation.md +++ b/docs/Installation.md @@ -26,7 +26,7 @@ Based on the different environment, there are some parameters can be set via -D | arrow_root | When build_arrow set to False, arrow_root will be enabled to find the location of your existing arrow library. | /usr/local | | build_protobuf | Build Protobuf from Source. If set to False, default library path will be used to find protobuf library. | True | -When build_arrow set to True, the build_arrow.sh will be launched and compile a custom arrow library from [OAP Arrow](https://github.com/oap-project/arrow/tree/arrow-4.0.0-oap) +When build_arrow set to True, the build_arrow.sh will be launched and compile a custom arrow library from [OAP Arrow](https://github.com/oap-project/arrow/tree/arrow-4.0.0-oap-1.3) If you wish to change any parameters from Arrow, you can change it from the `build_arrow.sh` script under `native-sql-engine/arrow-data-source/script/`. 
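For reference, a minimal sketch of how the build parameters listed above might be passed on the command line. The property names (`build_arrow`, `arrow_root`, `build_protobuf`) and their `True`/`False` values come from the parameter table in this document; the `mvn` invocation and the `-DskipTests` flag are assumptions for illustration, not part of this patch:

```
# Let build_arrow.sh fetch and compile the custom Arrow (arrow-4.0.0-oap-1.3 branch)
mvn clean package -DskipTests -Dbuild_arrow=True -Dbuild_protobuf=True

# Or reuse an Arrow library that is already installed under /usr/local
mvn clean package -DskipTests -Dbuild_arrow=False -Darrow_root=/usr/local
```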
### Additional Notes diff --git a/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/CompressedVectorLoader.java b/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/CompressedVectorLoader.java index 6a0cdbd76..8def18b04 100644 --- a/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/CompressedVectorLoader.java +++ b/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/CompressedVectorLoader.java @@ -65,4 +65,11 @@ public void loadCompressed(ArrowRecordBatch recordBatch) { + Collections2.toList(buffers).toString()); } } + + /** + * Direct router to VectorLoader#load() + */ + public void loadUncompressed(ArrowRecordBatch recordBatch) { + super.load(recordBatch); + } } diff --git a/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/SchemaAwareArrowCompressedStreamReader.java b/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/SchemaAwareArrowCompressedStreamReader.java index fc5fd0c2b..102427262 100644 --- a/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/SchemaAwareArrowCompressedStreamReader.java +++ b/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/SchemaAwareArrowCompressedStreamReader.java @@ -23,6 +23,7 @@ import org.apache.arrow.memory.BufferAllocator; import org.apache.arrow.vector.FieldVector; import org.apache.arrow.vector.VectorSchemaRoot; +import org.apache.arrow.vector.compression.NoCompressionCodec; import org.apache.arrow.vector.dictionary.Dictionary; import org.apache.arrow.vector.ipc.ArrowStreamReader; import org.apache.arrow.vector.ipc.message.ArrowDictionaryBatch; @@ -42,7 +43,11 @@ * ArrowRecordBatches. */ public class SchemaAwareArrowCompressedStreamReader extends ArrowStreamReader { + public static final String COMPRESS_TYPE_NONE = "none"; + private final Schema originalSchema; + + // fixme: the design can be improved to avoid relying on this stateful field private String compressType; public SchemaAwareArrowCompressedStreamReader(Schema originalSchema, InputStream in, @@ -57,7 +62,7 @@ public SchemaAwareArrowCompressedStreamReader(InputStream in, this(null, in, allocator); } - public String GetCompressType() { + public String getCompressType() { return compressType; } @@ -112,12 +117,17 @@ public boolean loadNextBatch() throws IOException { } ArrowRecordBatch batch = MessageSerializer.deserializeRecordBatch(result.getMessage(), bodyBuffer); - String codecName = CompressionType.name(batch.getBodyCompression().getCodec()); - - if (codecName.equals("LZ4_FRAME")) { - compressType = "lz4"; + byte codec = batch.getBodyCompression().getCodec(); + final String codecName; + if (codec == NoCompressionCodec.COMPRESSION_TYPE) { + compressType = COMPRESS_TYPE_NONE; } else { - compressType = codecName; + codecName = CompressionType.name(codec); + if (codecName.equals("LZ4_FRAME")) { + compressType = "lz4"; + } else { + compressType = codecName; + } } loadRecordBatch(batch); @@ -138,9 +148,18 @@ public boolean loadNextBatch() throws IOException { @Override protected void loadRecordBatch(ArrowRecordBatch batch) { try { - ((CompressedVectorLoader) loader).loadCompressed(batch); + CompressedVectorLoader loader = (CompressedVectorLoader) this.loader; + if (isCurrentBatchCompressed()) { + loader.loadCompressed(batch); + } else { + loader.loadUncompressed(batch); + } } finally { batch.close(); } } + + public boolean isCurrentBatchCompressed() { + return !Objects.equals(getCompressType(), COMPRESS_TYPE_NONE); + } } diff --git 
a/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/ShuffleSplitterJniWrapper.java b/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/ShuffleSplitterJniWrapper.java index b9c362c04..93d5f3223 100644 --- a/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/ShuffleSplitterJniWrapper.java +++ b/native-sql-engine/core/src/main/java/com/intel/oap/vectorized/ShuffleSplitterJniWrapper.java @@ -43,6 +43,7 @@ public long make( long offheapPerTask, int bufferSize, String codec, + int batchCompressThreshold, String dataFile, int subDirsPerLocalDir, String localDirs, @@ -57,6 +58,7 @@ public long make( offheapPerTask, bufferSize, codec, + batchCompressThreshold, dataFile, subDirsPerLocalDir, localDirs, @@ -73,6 +75,7 @@ public native long nativeMake( long offheapPerTask, int bufferSize, String codec, + int batchCompressThreshold, String dataFile, int subDirsPerLocalDir, String localDirs, diff --git a/native-sql-engine/core/src/main/scala/com/intel/oap/GazellePluginConfig.scala b/native-sql-engine/core/src/main/scala/com/intel/oap/GazellePluginConfig.scala index d7e243654..53b2f836f 100644 --- a/native-sql-engine/core/src/main/scala/com/intel/oap/GazellePluginConfig.scala +++ b/native-sql-engine/core/src/main/scala/com/intel/oap/GazellePluginConfig.scala @@ -187,7 +187,10 @@ class GazellePluginConfig(conf: SQLConf) extends Logging { val columnarShuffleUseCustomizedCompressionCodec: String = conf.getConfString("spark.oap.sql.columnar.shuffle.customizedCompression.codec", "lz4") - val shuffleSplitDefaultSize: Int = + val columnarShuffleBatchCompressThreshold: Int = + conf.getConfString("spark.oap.sql.columnar.shuffle.batchCompressThreshold", "100").toInt + + val shuffleSplitDefaultSize: Int = conf .getConfString("spark.oap.sql.columnar.shuffleSplitDefaultSize", "8192").toInt diff --git a/native-sql-engine/core/src/main/scala/com/intel/oap/expression/ColumnarUnaryOperator.scala b/native-sql-engine/core/src/main/scala/com/intel/oap/expression/ColumnarUnaryOperator.scala index f41c8ab6a..1dd97858a 100644 --- a/native-sql-engine/core/src/main/scala/com/intel/oap/expression/ColumnarUnaryOperator.scala +++ b/native-sql-engine/core/src/main/scala/com/intel/oap/expression/ColumnarUnaryOperator.scala @@ -408,6 +408,7 @@ class ColumnarCast( if (datatype == StringType) { val supported = List( + BooleanType, ByteType, ShortType, IntegerType, @@ -430,12 +431,14 @@ class ColumnarCast( } } else if (datatype == IntegerType) { val supported = - List(ByteType, ShortType, LongType, FloatType, DoubleType, DateType, DecimalType, StringType) + List(ByteType, ShortType, LongType, FloatType, DoubleType, DateType, + DecimalType, StringType) if (supported.indexOf(child.dataType) == -1 && !child.dataType.isInstanceOf[DecimalType]) { throw new UnsupportedOperationException(s"${child.dataType} is not supported in castINT") } } else if (datatype == LongType) { - val supported = List(IntegerType, FloatType, DoubleType, DateType, DecimalType, TimestampType, StringType) + val supported = List(IntegerType, FloatType, DoubleType, DateType, + DecimalType, TimestampType, StringType, BooleanType) if (supported.indexOf(child.dataType) == -1 && !child.dataType.isInstanceOf[DecimalType]) { throw new UnsupportedOperationException( @@ -494,21 +497,22 @@ class ColumnarCast( } if (dataType == StringType) { val limitLen: java.lang.Long = childType0 match { - case int: ArrowType.Int if int.getBitWidth == 8 => 4 - case int: ArrowType.Int if int.getBitWidth == 16 => 6 - case int: ArrowType.Int if int.getBitWidth == 
32 => 11 - case int: ArrowType.Int if int.getBitWidth == 64 => 20 + case int: ArrowType.Int if int.getBitWidth == 8 => 4L + case int: ArrowType.Int if int.getBitWidth == 16 => 6L + case int: ArrowType.Int if int.getBitWidth == 32 => 11L + case int: ArrowType.Int if int.getBitWidth == 64 => 20L case float: ArrowType.FloatingPoint if float.getPrecision() == FloatingPointPrecision.SINGLE => - 12 + 12L case float: ArrowType.FloatingPoint if float.getPrecision() == FloatingPointPrecision.DOUBLE => - 21 - case date: ArrowType.Date if date.getUnit == DateUnit.DAY => 10 + 21L + case _: ArrowType.Bool => 10L + case date: ArrowType.Date if date.getUnit == DateUnit.DAY => 10L case decimal: ArrowType.Decimal => // Add two to precision for decimal point and negative sign (decimal.getPrecision() + 2) - case _: ArrowType.Timestamp => 24 + case _: ArrowType.Timestamp => 24L case _ => throw new UnsupportedOperationException( s"ColumnarCast to String doesn't support ${childType0}") diff --git a/native-sql-engine/core/src/main/scala/com/intel/oap/vectorized/ArrowColumnarBatchSerializer.scala b/native-sql-engine/core/src/main/scala/com/intel/oap/vectorized/ArrowColumnarBatchSerializer.scala index 9ee99179f..a5e4d814b 100644 --- a/native-sql-engine/core/src/main/scala/com/intel/oap/vectorized/ArrowColumnarBatchSerializer.scala +++ b/native-sql-engine/core/src/main/scala/com/intel/oap/vectorized/ArrowColumnarBatchSerializer.scala @@ -131,7 +131,9 @@ private class ArrowColumnarBatchSerializerInstance( numRowsTotal += numRows // jni call to decompress buffers - if (compressionEnabled) { + if (compressionEnabled && + reader.asInstanceOf[SchemaAwareArrowCompressedStreamReader] + .isCurrentBatchCompressed) { try { decompressVectors() } catch { @@ -231,7 +233,7 @@ private class ArrowColumnarBatchSerializerInstance( val serializedBatch = jniWrapper.decompress( schemaHolderId, - reader.asInstanceOf[SchemaAwareArrowCompressedStreamReader].GetCompressType(), + reader.asInstanceOf[SchemaAwareArrowCompressedStreamReader].getCompressType, root.getRowCount, bufAddrs.toArray, bufSizes.toArray, diff --git a/native-sql-engine/core/src/main/scala/org/apache/spark/shuffle/ColumnarShuffleWriter.scala b/native-sql-engine/core/src/main/scala/org/apache/spark/shuffle/ColumnarShuffleWriter.scala index 24757ba24..a3b05e30c 100644 --- a/native-sql-engine/core/src/main/scala/org/apache/spark/shuffle/ColumnarShuffleWriter.scala +++ b/native-sql-engine/core/src/main/scala/org/apache/spark/shuffle/ColumnarShuffleWriter.scala @@ -71,6 +71,9 @@ class ColumnarShuffleWriter[K, V]( } else { "uncompressed" } + private val batchCompressThreshold = + GazellePluginConfig.getConf.columnarShuffleBatchCompressThreshold; + private val preferSpill = GazellePluginConfig.getConf.columnarShufflePreferSpill private val writeSchema = GazellePluginConfig.getConf.columnarShuffleWriteSchema @@ -103,6 +106,7 @@ class ColumnarShuffleWriter[K, V]( offheapPerTask, nativeBufferSize, defaultCompressionCodec, + batchCompressThreshold, dataTmp.getAbsolutePath, blockManager.subDirsPerLocalDir, localDirs, diff --git a/native-sql-engine/core/src/test/scala/com/intel/oap/misc/PartitioningSuite.scala b/native-sql-engine/core/src/test/scala/com/intel/oap/misc/PartitioningSuite.scala index 933d4c5a0..b6c18ad68 100644 --- a/native-sql-engine/core/src/test/scala/com/intel/oap/misc/PartitioningSuite.scala +++ b/native-sql-engine/core/src/test/scala/com/intel/oap/misc/PartitioningSuite.scala @@ -19,7 +19,7 @@ package com.intel.oap.misc import com.intel.oap.tpc.ds.TPCDSTableGen 
import com.intel.oap.tpc.util.TPCRunner -import org.apache.log4j.{Level, LogManager} +//import org.apache.log4j.{Level, LogManager} import org.apache.spark.SparkConf import org.apache.spark.sql.QueryTest import org.apache.spark.sql.functions.{col, expr} @@ -68,7 +68,7 @@ class PartitioningSuite extends QueryTest with SharedSparkSession { override def beforeAll(): Unit = { super.beforeAll() - LogManager.getRootLogger.setLevel(Level.WARN) + //LogManager.getRootLogger.setLevel(Level.WARN) lPath = Files.createTempFile("", ".parquet").toFile.getAbsolutePath spark.range(scale) diff --git a/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/ds/Orc_TPCDSSuite.scala b/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/ds/Orc_TPCDSSuite.scala index 47dff9b87..2126d7ec4 100644 --- a/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/ds/Orc_TPCDSSuite.scala +++ b/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/ds/Orc_TPCDSSuite.scala @@ -18,7 +18,7 @@ package com.intel.oap.tpc.ds import com.intel.oap.tpc.util.TPCRunner -import org.apache.log4j.{Level, LogManager} +//import org.apache.log4j.{Level, LogManager} import org.apache.spark.SparkConf import org.apache.spark.sql.QueryTest import org.apache.spark.sql.test.SharedSparkSession @@ -60,7 +60,7 @@ class Orc_TPCDSSuite extends QueryTest with SharedSparkSession { override def beforeAll(): Unit = { super.beforeAll() - LogManager.getRootLogger.setLevel(Level.WARN) + //LogManager.getRootLogger.setLevel(Level.WARN) val tGen = new Orc_TPCDSTableGen(spark, 0.1D, TPCDS_WRITE_PATH) tGen.gen() tGen.createTables() diff --git a/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/ds/TPCDSSuite.scala b/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/ds/TPCDSSuite.scala index 5efc338f7..c46906809 100644 --- a/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/ds/TPCDSSuite.scala +++ b/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/ds/TPCDSSuite.scala @@ -18,7 +18,7 @@ package com.intel.oap.tpc.ds import com.intel.oap.tpc.util.TPCRunner -import org.apache.log4j.{Level, LogManager} +//import org.apache.log4j.{Level, LogManager} import org.apache.spark.SparkConf import org.apache.spark.sql.QueryTest import org.apache.spark.sql.functions.{col, exp, expr} @@ -64,7 +64,7 @@ class TPCDSSuite extends QueryTest with SharedSparkSession { override def beforeAll(): Unit = { super.beforeAll() - LogManager.getRootLogger.setLevel(Level.WARN) + //LogManager.getRootLogger.setLevel(Level.WARN) val tGen = new TPCDSTableGen(spark, 0.1D, TPCDS_WRITE_PATH) tGen.gen() tGen.createTables() diff --git a/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/h/Orc_TPCHSuite.scala b/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/h/Orc_TPCHSuite.scala index 1b904da3f..c3e669439 100644 --- a/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/h/Orc_TPCHSuite.scala +++ b/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/h/Orc_TPCHSuite.scala @@ -24,7 +24,7 @@ import com.intel.oap.tpc.MallocUtils import com.intel.oap.tpc.h.TPCHSuite.RAMMonitor import com.intel.oap.tpc.util.TPCRunner import org.apache.commons.lang.StringUtils -import org.apache.log4j.{Level, LogManager} +//import org.apache.log4j.{Level, LogManager} import org.apache.spark.SparkConf import org.apache.spark.sql.QueryTest import org.apache.spark.sql.test.SharedSparkSession @@ -63,7 +63,7 @@ class Orc_TPCHSuite extends QueryTest with SharedSparkSession { override def beforeAll(): Unit = { super.beforeAll() - LogManager.getRootLogger.setLevel(Level.WARN) + 
//LogManager.getRootLogger.setLevel(Level.WARN) val tGen = new Orc_TPCHTableGen(spark, 0.1D, TPCH_WRITE_PATH) tGen.gen() tGen.createTables() diff --git a/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/h/TPCHSuite.scala b/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/h/TPCHSuite.scala index 7aab58b8d..4308d32be 100644 --- a/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/h/TPCHSuite.scala +++ b/native-sql-engine/core/src/test/scala/com/intel/oap/tpc/h/TPCHSuite.scala @@ -27,7 +27,7 @@ import com.intel.oap.tpc.MallocUtils import com.intel.oap.tpc.h.TPCHSuite.RAMMonitor import com.intel.oap.tpc.util.TPCRunner import org.apache.commons.lang.StringUtils -import org.apache.log4j.{Level, LogManager} +//import org.apache.log4j.{Level, LogManager} import org.apache.spark.SparkConf import org.apache.spark.sql.QueryTest import org.apache.spark.sql.test.SharedSparkSession @@ -72,7 +72,7 @@ class TPCHSuite extends QueryTest with SharedSparkSession { override def beforeAll(): Unit = { super.beforeAll() - LogManager.getRootLogger.setLevel(Level.WARN) + //LogManager.getRootLogger.setLevel(Level.WARN) val tGen = new TPCHTableGen(spark, 0.1D, TPCH_WRITE_PATH) tGen.gen() tGen.createTables() diff --git a/native-sql-engine/core/src/test/scala/com/intel/oap/vectorized/ArrowColumnarBatchSerializerSuite.scala b/native-sql-engine/core/src/test/scala/com/intel/oap/vectorized/ArrowColumnarBatchSerializerSuite.scala index a9cf42c7b..4d63faa5c 100644 --- a/native-sql-engine/core/src/test/scala/com/intel/oap/vectorized/ArrowColumnarBatchSerializerSuite.scala +++ b/native-sql-engine/core/src/test/scala/com/intel/oap/vectorized/ArrowColumnarBatchSerializerSuite.scala @@ -40,8 +40,8 @@ class ArrowColumnarBatchSerializerSuite extends SparkFunSuite with SharedSparkSe override def sparkConf: SparkConf = super.sparkConf - .set("spark.shuffle.compress", "false") - .set("spark.oap.sql.columnar.shuffle.writeSchema", "true") + .set("spark.shuffle.compress", "false") + .set("spark.oap.sql.columnar.shuffle.writeSchema", "true") override def beforeEach() = { avgBatchNumRows = SQLMetrics.createAverageMetric( @@ -51,67 +51,71 @@ class ArrowColumnarBatchSerializerSuite extends SparkFunSuite with SharedSparkSe SQLMetrics.createAverageMetric(spark.sparkContext, "test serializer number of output rows") } - test("deserialize all null") { - val input = getTestResourcePath("test-data/native-splitter-output-all-null") - val serializer = - new ArrowColumnarBatchSerializer( - new StructType( - Array(StructField("f1", BooleanType), StructField("f2", IntegerType), - StructField("f3", StringType))), - avgBatchNumRows, - outputNumRows).newInstance() - val deserializedStream = - serializer.deserializeStream(new FileInputStream(input)) + ignore("deserialize all null") { + withSQLConf("spark.oap.sql.columnar.shuffle.writeSchema" -> "true") { + val input = getTestResourcePath("test-data/native-splitter-output-all-null") + val serializer = + new ArrowColumnarBatchSerializer( + new StructType( + Array(StructField("f1", BooleanType), StructField("f2", IntegerType), + StructField("f3", StringType))), + avgBatchNumRows, + outputNumRows).newInstance() + val deserializedStream = + serializer.deserializeStream(new FileInputStream(input)) - val kv = deserializedStream.asKeyValueIterator - var length = 0 - kv.foreach { - case (_, batch: ColumnarBatch) => - length += 1 - assert(batch.numRows == 4) - assert(batch.numCols == 3) - (0 until batch.numCols).foreach { i => - val valueVector = - batch - .column(i) - 
.asInstanceOf[ArrowWritableColumnVector] - .getValueVector - assert(valueVector.getValueCount == batch.numRows) - assert(valueVector.getNullCount === batch.numRows) - } + val kv = deserializedStream.asKeyValueIterator + var length = 0 + kv.foreach { + case (_, batch: ColumnarBatch) => + length += 1 + assert(batch.numRows == 4) + assert(batch.numCols == 3) + (0 until batch.numCols).foreach { i => + val valueVector = + batch + .column(i) + .asInstanceOf[ArrowWritableColumnVector] + .getValueVector + assert(valueVector.getValueCount == batch.numRows) + assert(valueVector.getNullCount === batch.numRows) + } + } + assert(length == 2) + deserializedStream.close() } - assert(length == 2) - deserializedStream.close() } - test("deserialize nullable string") { - val input = getTestResourcePath("test-data/native-splitter-output-nullable-string") - val serializer = - new ArrowColumnarBatchSerializer( + ignore("deserialize nullable string") { + withSQLConf("spark.oap.sql.columnar.shuffle.writeSchema" -> "true") { + val input = getTestResourcePath("test-data/native-splitter-output-nullable-string") + val serializer = + new ArrowColumnarBatchSerializer( new StructType( Array(StructField("f1", BooleanType), StructField("f2", StringType), StructField("f3", StringType))), avgBatchNumRows, - outputNumRows).newInstance() - val deserializedStream = - serializer.deserializeStream(new FileInputStream(input)) + outputNumRows).newInstance() + val deserializedStream = + serializer.deserializeStream(new FileInputStream(input)) - val kv = deserializedStream.asKeyValueIterator - var length = 0 - kv.foreach { - case (_, batch: ColumnarBatch) => - length += 1 - assert(batch.numRows == 8) - assert(batch.numCols == 3) - (0 until batch.numCols).foreach { i => - val valueVector = - batch - .column(i) - .asInstanceOf[ArrowWritableColumnVector] - .getValueVector - assert(valueVector.getValueCount == batch.numRows) - } + val kv = deserializedStream.asKeyValueIterator + var length = 0 + kv.foreach { + case (_, batch: ColumnarBatch) => + length += 1 + assert(batch.numRows == 8) + assert(batch.numCols == 3) + (0 until batch.numCols).foreach { i => + val valueVector = + batch + .column(i) + .asInstanceOf[ArrowWritableColumnVector] + .getValueVector + assert(valueVector.getValueCount == batch.numRows) + } + } + assert(length == 2) + deserializedStream.close() } - assert(length == 2) - deserializedStream.close() } } diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/CTEHintSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/CTEHintSuite.scala index 13039bbbf..5a311fd51 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/CTEHintSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/CTEHintSuite.scala @@ -17,7 +17,7 @@ package org.apache.spark.sql -import org.apache.log4j.Level +//import org.apache.log4j.Level import org.apache.spark.sql.catalyst.plans.logical._ import org.apache.spark.sql.test.SharedSparkSession @@ -55,6 +55,7 @@ class CTEHintSuite extends QueryTest with SharedSparkSession { assert(joinHints == expectedHints) } + /* Remark log4j1 unit test def verifyJoinHintWithWarnings( df: => DataFrame, expectedHints: Seq[JoinHint], @@ -72,6 +73,7 @@ class CTEHintSuite extends QueryTest with SharedSparkSession { assert(warningMessages.contains(w)) } } + */ def msgNoJoinForJoinHint(strategy: String): String = s"A join hint (strategy=$strategy) is specified but it is not part of a join relation." 
@@ -133,6 +135,7 @@ class CTEHintSuite extends QueryTest with SharedSparkSession { Some(HintInfo(strategy = Some(SHUFFLE_HASH))), None) :: Nil ) + /* Remark log4j1 unit test verifyJoinHintWithWarnings( sql( """ @@ -151,6 +154,7 @@ class CTEHintSuite extends QueryTest with SharedSparkSession { msgNoJoinForJoinHint("shuffle_hash") :: msgJoinHintOverridden("broadcast") :: Nil ) + */ verifyJoinHint( sql( """ diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/CharVarcharTestSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/CharVarcharTestSuite.scala index 177517236..3b3d78b12 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/CharVarcharTestSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/CharVarcharTestSuite.scala @@ -639,6 +639,7 @@ trait CharVarcharTestSuite extends QueryTest with SQLTestUtils { class BasicCharVarcharTestSuite extends QueryTest with SharedSparkSession { import testImplicits._ + /* Remark log4j1 unit test test("user-specified schema in cast") { def assertNoCharType(df: DataFrame): Unit = { checkAnswer(df, Row("0")) @@ -655,6 +656,7 @@ class BasicCharVarcharTestSuite extends QueryTest with SharedSparkSession { assertNoCharType(sql("SELECT CAST(id AS CHAR(5)) FROM range(1)")) } } + */ def failWithInvalidCharUsage[T](fn: => T): Unit = { val e = intercept[AnalysisException](fn) diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/JoinHintSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/JoinHintSuite.scala index 5de3b1f4a..4ec07f536 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/JoinHintSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/JoinHintSuite.scala @@ -17,7 +17,7 @@ package org.apache.spark.sql -import org.apache.log4j.Level +//import org.apache.log4j.Level import org.apache.spark.sql.catalyst.optimizer.{BuildLeft, BuildRight, BuildSide, EliminateResolvedHint} import org.apache.spark.sql.catalyst.plans.PlanTest @@ -45,6 +45,7 @@ class JoinHintSuite extends PlanTest with SharedSparkSession with AdaptiveSparkP def msgJoinHintOverridden(strategy: String): String = s"Hint (strategy=$strategy) is overridden by another hint and will not take effect." 
+ /* Remark log4j1 unit test def verifyJoinHintWithWarnings( df: => DataFrame, expectedHints: Seq[JoinHint], @@ -62,6 +63,7 @@ class JoinHintSuite extends PlanTest with SharedSparkSession with AdaptiveSparkP assert(warningMessages.contains(w)) } } + */ def verifyJoinHint(df: DataFrame, expectedHints: Seq[JoinHint]): Unit = { val optimized = df.queryExecution.optimizedPlan @@ -210,6 +212,7 @@ class JoinHintSuite extends PlanTest with SharedSparkSession with AdaptiveSparkP ) } + /* Remark log4j1 unit test test("hint merge") { verifyJoinHintWithWarnings( df.hint("broadcast").filter($"id" > 2).hint("broadcast").join(df, "id"), @@ -248,7 +251,9 @@ class JoinHintSuite extends PlanTest with SharedSparkSession with AdaptiveSparkP msgJoinHintOverridden("shuffle_hash") :: Nil ) } + */ + /* Remark log4j1 unit test test("hint merge - SQL") { withTempView("a", "b", "c") { df1.createOrReplaceTempView("a") @@ -299,6 +304,7 @@ class JoinHintSuite extends PlanTest with SharedSparkSession with AdaptiveSparkP ) } } + */ test("nested hint") { verifyJoinHint( diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/SparkSessionBuilderSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/SparkSessionBuilderSuite.scala index 1f16bb69b..9db9966b7 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/SparkSessionBuilderSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/SparkSessionBuilderSuite.scala @@ -387,6 +387,7 @@ class SparkSessionBuilderSuite extends SparkFunSuite with BeforeAndAfterEach { } + /* Remark log4j1 unit test test("SPARK-33944: warning setting hive.metastore.warehouse.dir using session options") { val msg = "Not allowing to set hive.metastore.warehouse.dir in SparkSession's options" val logAppender = new LogAppender(msg) @@ -399,7 +400,9 @@ class SparkSessionBuilderSuite extends SparkFunSuite with BeforeAndAfterEach { } assert(logAppender.loggingEvents.exists(_.getRenderedMessage.contains(msg))) } + */ + /* Remark log4j1 unit test test("SPARK-33944: no warning setting spark.sql.warehouse.dir using session options") { val msg = "Not allowing to set hive.metastore.warehouse.dir in SparkSession's options" val logAppender = new LogAppender(msg) @@ -412,4 +415,5 @@ class SparkSessionBuilderSuite extends SparkFunSuite with BeforeAndAfterEach { } assert(!logAppender.loggingEvents.exists(_.getRenderedMessage.contains(msg))) } + */ } diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/adaptive/AdaptiveQueryExecSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/adaptive/AdaptiveQueryExecSuite.scala index d0839d484..4595ed628 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/adaptive/AdaptiveQueryExecSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/adaptive/AdaptiveQueryExecSuite.scala @@ -21,7 +21,7 @@ import java.io.File import java.net.URI import com.intel.oap.execution.{ColumnarBroadcastHashJoinExec, ColumnarSortMergeJoinExec} -import org.apache.log4j.Level +//import org.apache.log4j.Level import org.apache.spark.scheduler.{SparkListener, SparkListenerEvent, SparkListenerJobStart} import org.apache.spark.sql.{Dataset, QueryTest, Row, SparkSession, Strategy} import org.apache.spark.sql.catalyst.optimizer.{BuildLeft, BuildRight} @@ -797,6 +797,7 @@ class AdaptiveQueryExecSuite } } + /* Remark log4j1 unit test test("SPARK-30719: do not log warning if intentionally skip AQE") { val testAppender = new 
LogAppender("aqe logging warning test when skip") withLogAppender(testAppender) { @@ -811,7 +812,9 @@ class AdaptiveQueryExecSuite s"${SQLConf.ADAPTIVE_EXECUTION_ENABLED.key} is" + s" enabled but is not supported for"))) } + */ + /* Remark log4j1 unit test test("test log level") { def verifyLog(expectedLevel: Level): Unit = { val logAppender = new LogAppender("adaptive execution") @@ -856,6 +859,7 @@ class AdaptiveQueryExecSuite } } } + */ test("tree string output") { withSQLConf(SQLConf.ADAPTIVE_EXECUTION_ENABLED.key -> "true") { diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/adaptive/ColumnarAdaptiveQueryExecSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/adaptive/ColumnarAdaptiveQueryExecSuite.scala index addb95dbf..ee92b78a3 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/adaptive/ColumnarAdaptiveQueryExecSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/adaptive/ColumnarAdaptiveQueryExecSuite.scala @@ -20,7 +20,7 @@ package org.apache.spark.sql.execution.adaptive import java.io.File import java.net.URI -import org.apache.log4j.Level +//import org.apache.log4j.Level import org.apache.spark.SparkConf import org.apache.spark.scheduler.{SparkListener, SparkListenerEvent, SparkListenerJobStart} import org.apache.spark.sql.{Dataset, QueryTest, Row, SparkSession, Strategy} diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/datasources/csv/CSVSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/datasources/csv/CSVSuite.scala index 30f0e45d0..c15f6f0d7 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/datasources/csv/CSVSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/datasources/csv/CSVSuite.scala @@ -1780,6 +1780,7 @@ abstract class CSVSuite assert(exception.getMessage.contains("CSV header does not conform to the schema")) } + /* Remark log4j1 unit test test("SPARK-23786: warning should be printed if CSV header doesn't conform to schema") { val testAppender1 = new LogAppender("CSV header matches to schema") withLogAppender(testAppender1) { @@ -1809,6 +1810,7 @@ abstract class CSVSuite assert(testAppender2.loggingEvents .exists(msg => msg.getRenderedMessage.contains("CSV header does not conform to the schema"))) } + */ test("SPARK-25134: check header on parsing of dataset with projection and column pruning") { withSQLConf(SQLConf.CSV_PARSER_COLUMN_PRUNING.key -> "true") { diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTableCatalogSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTableCatalogSuite.scala index c03768d8e..dee37058a 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTableCatalogSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTableCatalogSuite.scala @@ -19,7 +19,7 @@ package org.apache.spark.sql.execution.datasources.v2.jdbc import java.sql.{Connection, DriverManager} import java.util.Properties -import org.apache.log4j.Level +//import org.apache.log4j.Level import org.apache.spark.SparkConf import org.apache.spark.sql.{AnalysisException, QueryTest, Row} @@ -391,6 +391,7 @@ class JDBCTableCatalogSuite extends QueryTest with SharedSparkSession { } } + /* Remark log4j1 unit test 
test("CREATE TABLE with table comment") { withTable("h2.test.new_table") { val logAppender = new LogAppender("table comment") @@ -404,6 +405,7 @@ class JDBCTableCatalogSuite extends QueryTest with SharedSparkSession { assert(createCommentWarning === false) } } + */ test("CREATE TABLE with table property") { withTable("h2.test.new_table") { diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/internal/SQLConfSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/internal/SQLConfSuite.scala index 1ea2d4fd0..4780b9a96 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/internal/SQLConfSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/internal/SQLConfSuite.scala @@ -20,7 +20,7 @@ package org.apache.spark.sql.internal import java.util.TimeZone import org.apache.hadoop.fs.Path -import org.apache.log4j.Level +//import org.apache.log4j.Level import org.apache.spark.sql._ import org.apache.spark.sql.catalyst.parser.ParseException @@ -387,6 +387,7 @@ class SQLConfSuite extends QueryTest with SharedSparkSession { assert(e.getMessage.contains(config)) } + /* Remark log4j1 unit test test("log deprecation warnings") { val logAppender = new LogAppender("deprecated SQL configs") def check(config: String): Unit = { @@ -407,6 +408,7 @@ class SQLConfSuite extends QueryTest with SharedSparkSession { } check(config2) } + */ test("spark.sql.session.timeZone should only accept valid zone id") { spark.conf.set(SQLConf.SESSION_LOCAL_TIMEZONE.key, MIT.getId) diff --git a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/nativesql/NativeColumnarAdaptiveQueryExecSuite.scala b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/nativesql/NativeColumnarAdaptiveQueryExecSuite.scala index 5f7412a42..9875d9978 100644 --- a/native-sql-engine/core/src/test/scala/org/apache/spark/sql/nativesql/NativeColumnarAdaptiveQueryExecSuite.scala +++ b/native-sql-engine/core/src/test/scala/org/apache/spark/sql/nativesql/NativeColumnarAdaptiveQueryExecSuite.scala @@ -20,7 +20,7 @@ package org.apache.spark.sql.nativesql import java.io.File import java.net.URI -import org.apache.log4j.Level +//import org.apache.log4j.Level import org.apache.spark.SparkConf import org.apache.spark.scheduler.{SparkListener, SparkListenerEvent, SparkListenerJobStart} import org.apache.spark.sql.{Dataset, QueryTest, Row, SparkSession, Strategy} diff --git a/native-sql-engine/cpp/src/CMakeLists.txt b/native-sql-engine/cpp/src/CMakeLists.txt index 9aeac55e1..7681ea973 100644 --- a/native-sql-engine/cpp/src/CMakeLists.txt +++ b/native-sql-engine/cpp/src/CMakeLists.txt @@ -140,7 +140,7 @@ macro(build_arrow STATIC_ARROW) ExternalProject_Add(arrow_ep GIT_REPOSITORY https://github.com/oap-project/arrow.git SOURCE_DIR ${ARROW_SOURCE_DIR} - GIT_TAG arrow-4.0.0-oap + GIT_TAG arrow-4.0.0-oap-1.3 BUILD_IN_SOURCE 1 INSTALL_DIR ${ARROW_PREFIX} INSTALL_COMMAND make install @@ -304,11 +304,13 @@ macro(find_arrow) file(COPY ${ARROW_BFS_INCLUDE_DIR}/arrow DESTINATION ${root_directory}/releases/include) file(COPY ${ARROW_BFS_INCLUDE_DIR}/gandiva DESTINATION ${root_directory}/releases/include) file(COPY ${ARROW_BFS_INCLUDE_DIR}/parquet DESTINATION ${root_directory}/releases/include) + file(COPY ${ARROW_BFS_INCLUDE_DIR}/re2 DESTINATION ${root_directory}/releases/include) else() message(STATUS "COPY and Set Arrow Header to: ${ARROW_INCLUDE_DIR}") file(COPY ${ARROW_INCLUDE_DIR}/arrow DESTINATION ${root_directory}/releases/include) file(COPY ${ARROW_INCLUDE_DIR}/gandiva DESTINATION 
${root_directory}/releases/include) file(COPY ${ARROW_INCLUDE_DIR}/parquet DESTINATION ${root_directory}/releases/include) + file(COPY ${ARROW_INCLUDE_DIR}/re2 DESTINATION ${root_directory}/releases/include) endif() # Set up Arrow Shared Library Directory diff --git a/native-sql-engine/cpp/src/codegen/arrow_compute/ext/expression_codegen_visitor.cc b/native-sql-engine/cpp/src/codegen/arrow_compute/ext/expression_codegen_visitor.cc index d3df9dfa9..b4a807289 100644 --- a/native-sql-engine/cpp/src/codegen/arrow_compute/ext/expression_codegen_visitor.cc +++ b/native-sql-engine/cpp/src/codegen/arrow_compute/ext/expression_codegen_visitor.cc @@ -100,7 +100,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) prepare_str_ += child_visitor_list[i]->GetPrepare(); } codes_str_ = ss.str(); - header_list_.push_back(R"(#include "precompile/gandiva.h")"); } else if (func_name.compare("greater_than") == 0) { real_codes_str_ = "(" + child_visitor_list[0]->GetResult() + " > " + child_visitor_list[1]->GetResult() + ")"; @@ -123,7 +122,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) prepare_str_ += child_visitor_list[i]->GetPrepare(); } codes_str_ = ss.str(); - header_list_.push_back(R"(#include "precompile/gandiva.h")"); } else if (func_name.compare("less_than_or_equal_to") == 0) { real_codes_str_ = "(" + child_visitor_list[0]->GetResult() + " <= " + child_visitor_list[1]->GetResult() + ")"; @@ -147,7 +145,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) prepare_str_ += child_visitor_list[i]->GetPrepare(); } codes_str_ = ss.str(); - header_list_.push_back(R"(#include "precompile/gandiva.h")"); } else if (func_name.compare("greater_than_or_equal_to") == 0) { real_codes_str_ = "(" + child_visitor_list[0]->GetResult() + " >= " + child_visitor_list[1]->GetResult() + ")"; @@ -171,7 +168,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) prepare_str_ += child_visitor_list[i]->GetPrepare(); } codes_str_ = ss.str(); - header_list_.push_back(R"(#include "precompile/gandiva.h")"); } else if (func_name.compare("equal") == 0) { real_codes_str_ = "(" + child_visitor_list[0]->GetResult() + " == " + child_visitor_list[1]->GetResult() + ")"; @@ -194,7 +190,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) prepare_str_ += child_visitor_list[i]->GetPrepare(); } codes_str_ = ss.str(); - header_list_.push_back(R"(#include "precompile/gandiva.h")"); } else if (func_name.compare("not") == 0) { std::string check_validity; if (child_visitor_list[0]->GetPreCheck() != "") { @@ -246,6 +241,26 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) << ".rfind(" << child_visitor_list[1]->GetResult() << ") != std::string::npos;"; prepare_str_ += prepare_ss.str(); + } else if (func_name.compare("like") == 0) { + codes_str_ = func_name + "_" + std::to_string(cur_func_id); + auto validity = codes_str_ + "_validity"; + real_codes_str_ = codes_str_; + real_validity_str_ = validity; + std::stringstream prepare_ss; + prepare_ss << GetCTypeString(node.return_type()) << " " << codes_str_ << ";" + << std::endl; + prepare_ss << "bool " << validity << " = " << child_visitor_list[0]->GetPreCheck() + << ";" << std::endl; + prepare_ss << "if (" << validity << ") {" << std::endl; + prepare_ss << codes_str_ << " = like" + << "(" << child_visitor_list[0]->GetResult() << ", " + << child_visitor_list[1]->GetResult() << ");" << std::endl; + prepare_ss 
<< "}" << std::endl; + for (int i = 0; i < 1; i++) { + prepare_str_ += child_visitor_list[i]->GetPrepare(); + } + prepare_str_ += prepare_ss.str(); + check_str_ = validity; } else if (func_name.compare("get_json_object") == 0) { for (int i = 0; i < 2; i++) { prepare_str_ += child_visitor_list[i]->GetPrepare(); @@ -255,12 +270,18 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) real_codes_str_ = codes_str_; real_validity_str_ = check_str_; std::stringstream prepare_ss; - prepare_ss << "bool " << check_str_ << " = true;" << std::endl; - prepare_ss << "std::string " << codes_str_ << " = get_json_object(" + auto validity = codes_str_ + "_validity"; + prepare_ss << "std::string " << codes_str_ << ";" << std::endl; + prepare_ss << "bool " << validity << " = " << child_visitor_list[0]->GetPreCheck() + << ";" << std::endl; + prepare_ss << "if (" << validity << ") {" << std::endl; + prepare_ss << codes_str_ << " = get_json_object(" << child_visitor_list[0]->GetResult() << ", " - << child_visitor_list[1]->GetResult() << ");\n"; + << child_visitor_list[1]->GetResult() << ", " + << "&" << validity << ");\n"; + prepare_ss << "}" << std::endl; prepare_str_ += prepare_ss.str(); - header_list_.push_back(R"(#include "precompile/gandiva.h")"); + check_str_ = validity; } else if (func_name.compare("substr") == 0) { ss << child_visitor_list[0]->GetResult() << ".substr(" << "((" << child_visitor_list[1]->GetResult() << " - 1) < 0 ? 0 : (" @@ -282,6 +303,37 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) prepare_ss << "if (" << check_str_ << ")" << std::endl; prepare_ss << codes_str_ << " = " << ss.str() << ";" << std::endl; prepare_str_ += prepare_ss.str(); + } else if (func_name.compare("btrim") == 0) { + codes_str_ = func_name + "_" + std::to_string(cur_func_id); + auto validity = codes_str_ + "_validity"; + real_codes_str_ = codes_str_; + real_validity_str_ = validity; + std::stringstream prepare_ss; + prepare_ss << GetCTypeString(node.return_type()) << " " << codes_str_ << ";" + << std::endl; + prepare_ss << "bool " << validity << " = " << child_visitor_list[0]->GetPreCheck() + << ";" << std::endl; + prepare_ss << "if (" << validity << ") {" << std::endl; + prepare_ss << "std::string arg = " << child_visitor_list[0]->GetResult() << ";" + << std::endl; + prepare_ss << "int start_index = 0, end_index = arg.length() - 1;" << std::endl; + prepare_ss << "while (start_index <= end_index && arg[start_index] == ' ') {" + << std::endl; + prepare_ss << "start_index++;" << std::endl; + prepare_ss << "}" << std::endl; + prepare_ss << "while (end_index >= start_index && arg[end_index] == ' ') {" + << std::endl; + prepare_ss << "end_index--;" << std::endl; + prepare_ss << "}" << std::endl; + prepare_ss << codes_str_ << " = arg.substr(start_index, end_index - start_index + 1);" + << std::endl; + prepare_ss << "}" << std::endl; + for (int i = 0; i < 1; i++) { + prepare_str_ += child_visitor_list[i]->GetPrepare(); + } + prepare_str_ += prepare_ss.str(); + check_str_ = validity; + } else if (func_name.compare("upper") == 0) { std::stringstream prepare_ss; auto child_name = child_visitor_list[0]->GetResult(); @@ -377,7 +429,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node) << child_visitor_list[0]->GetResult() << ", " << decimal_type->scale() << "));" << std::endl; } - header_list_.push_back(R"(#include "precompile/gandiva.h")"); } prepare_ss << "}" << std::endl; @@ -439,7 +490,6 @@ arrow::Status 
ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
     }
     prepare_str_ += prepare_ss.str();
     check_str_ = validity;
-    header_list_.push_back(R"(#include "precompile/gandiva.h")");
   } else if (func_name.compare("castDECIMAL") == 0) {
     codes_str_ = func_name + "_" + std::to_string(cur_func_id);
     auto validity = codes_str_ + "_validity";
@@ -474,7 +524,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
     }
     prepare_str_ += prepare_ss.str();
     check_str_ = validity;
-    header_list_.push_back(R"(#include "precompile/gandiva.h")");
   } else if (func_name.compare("castDECIMALNullOnOverflow") == 0) {
     codes_str_ = func_name + "_" + std::to_string(cur_func_id);
     auto validity = codes_str_ + "_validity";
@@ -506,7 +555,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
     }
     prepare_str_ += prepare_ss.str();
     check_str_ = validity;
-    header_list_.push_back(R"(#include "precompile/gandiva.h")");
   } else if (func_name.compare("castINTOrNull") == 0 ||
              func_name.compare("castBIGINTOrNull") == 0 ||
              func_name.compare("castFLOAT4OrNull") == 0 ||
@@ -532,8 +580,12 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
       } else {
         func_str = " = std::stod";
       }
+      prepare_ss << "try {" << std::endl;
       prepare_ss << codes_str_ << func_str << "(" << child_visitor_list[0]->GetResult()
                  << ");" << std::endl;
+      prepare_ss << "} catch (std::invalid_argument) {" << std::endl;
+      prepare_ss << validity << " = false;" << std::endl;
+      prepare_ss << "}" << std::endl;
       prepare_ss << "}" << std::endl;
 
       for (int i = 0; i < 1; i++) {
@@ -569,7 +621,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
     }
     prepare_str_ += prepare_ss.str();
     check_str_ = validity;
-    header_list_.push_back(R"(#include "precompile/gandiva.h")");
   } else if (func_name.compare("extractYear") == 0) {
     codes_str_ = func_name + "_" + std::to_string(cur_func_id);
     auto validity = codes_str_ + "_validity";
@@ -590,7 +641,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
     }
     prepare_str_ += prepare_ss.str();
     check_str_ = validity;
-    header_list_.push_back(R"(#include "precompile/gandiva.h")");
   } else if (func_name.compare("round") == 0) {
     codes_str_ = func_name + "_" + std::to_string(cur_func_id);
     auto validity = codes_str_ + "_validity";
@@ -629,7 +679,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
 
     prepare_str_ += prepare_ss.str();
     check_str_ = validity;
-    header_list_.push_back(R"(#include "precompile/gandiva.h")");
   } else if (func_name.compare("abs") == 0) {
     codes_str_ = "abs_" + std::to_string(cur_func_id);
     auto validity = codes_str_ + "_validity";
@@ -677,7 +726,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
                << child_visitor_list[1]->GetResult() << ", " << rightType->precision()
                << ", " << rightType->scale() << ", " << resType->precision() << ", "
                << resType->scale() << ")";
-      header_list_.push_back(R"(#include "precompile/gandiva.h")");
     }
     std::stringstream prepare_ss;
     prepare_ss << GetCTypeString(node.return_type()) << " " << codes_str_ << ";"
@@ -717,7 +765,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
                << child_visitor_list[1]->GetResult() << ", " << rightType->precision()
                << ", " << rightType->scale() << ", " << resType->precision() << ", "
                << resType->scale() << ")";
-      header_list_.push_back(R"(#include "precompile/gandiva.h")");
     }
     std::stringstream prepare_ss;
     prepare_ss << GetCTypeString(node.return_type()) << " " << codes_str_ << ";"
@@ -757,7 +804,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
                << child_visitor_list[1]->GetResult() << ", " << rightType->precision()
                << ", " << rightType->scale() << ", " << resType->precision() << ", "
                << resType->scale() << ", &overflow)";
-      header_list_.push_back(R"(#include "precompile/gandiva.h")");
     }
     std::stringstream prepare_ss;
     prepare_ss << GetCTypeString(node.return_type()) << " " << codes_str_ << ";"
@@ -803,7 +849,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
                << child_visitor_list[1]->GetResult() << ", " << rightType->precision()
                << ", " << rightType->scale() << ", " << resType->precision() << ", "
                << resType->scale() << ", &overflow)";
-      header_list_.push_back(R"(#include "precompile/gandiva.h")");
     }
     std::stringstream prepare_ss;
     prepare_ss << GetCTypeString(node.return_type()) << " " << codes_str_ << ";"
@@ -937,7 +982,6 @@ arrow::Status ExpressionCodegenVisitor::Visit(const gandiva::FunctionNode& node)
     }
     prepare_str_ += prepare_ss.str();
     check_str_ = validity;
-    header_list_.push_back(R"(#include "precompile/gandiva.h")");
   } else if (func_name.compare("convertTimestampUnit") == 0) {
     codes_str_ = "convertTimestampUnit_" + std::to_string(cur_func_id);
     auto validity = codes_str_ + "_validity";
diff --git a/native-sql-engine/cpp/src/codegen/arrow_compute/ext/kernels_ext.h b/native-sql-engine/cpp/src/codegen/arrow_compute/ext/kernels_ext.h
index ffa15f792..520f4b60f 100644
--- a/native-sql-engine/cpp/src/codegen/arrow_compute/ext/kernels_ext.h
+++ b/native-sql-engine/cpp/src/codegen/arrow_compute/ext/kernels_ext.h
@@ -173,6 +173,11 @@ class WindowAggregateFunctionKernel : public KernalBase {
   arrow::Result<std::shared_ptr<arrow::ArrayBuilder>> createBuilder(
       std::shared_ptr<arrow::DataType> data_type);
 
+  template <typename T>
+  typename arrow::enable_if_string_like<
+      T, arrow::Result<std::shared_ptr<arrow::ArrayBuilder>>>
+  createBuilder(std::shared_ptr<arrow::DataType> data_type);
+
   arrow::compute::ExecContext* ctx_ = nullptr;
   std::shared_ptr<ActionBase> action_;
   std::vector<std::shared_ptr<arrow::Array>> accumulated_group_ids_;
diff --git a/native-sql-engine/cpp/src/codegen/arrow_compute/ext/whole_stage_codegen_kernel.cc b/native-sql-engine/cpp/src/codegen/arrow_compute/ext/whole_stage_codegen_kernel.cc
index b0d575c10..0e0f6a8a7 100644
--- a/native-sql-engine/cpp/src/codegen/arrow_compute/ext/whole_stage_codegen_kernel.cc
+++ b/native-sql-engine/cpp/src/codegen/arrow_compute/ext/whole_stage_codegen_kernel.cc
@@ -330,7 +330,7 @@ class WholeStageCodeGenKernel::Impl {
     }
 
     codes_ss << R"(
-using namespace sparkcolumnarplugin::precompile;
+
 class TypedWholeStageCodeGenImpl : public CodeGenBase {
  public:
   TypedWholeStageCodeGenImpl(arrow::compute::ExecContext *ctx) : ctx_(ctx) {}
diff --git a/native-sql-engine/cpp/src/codegen/arrow_compute/ext/window_kernel.cc b/native-sql-engine/cpp/src/codegen/arrow_compute/ext/window_kernel.cc
index edc1dfad7..3423c8c81 100644
--- a/native-sql-engine/cpp/src/codegen/arrow_compute/ext/window_kernel.cc
+++ b/native-sql-engine/cpp/src/codegen/arrow_compute/ext/window_kernel.cc
@@ -154,6 +154,7 @@ arrow::Status WindowAggregateFunctionKernel::Evaluate(ArrayList& in) {
   PROC(arrow::FloatType, arrow::FloatBuilder, arrow::FloatArray)               \
   PROC(arrow::DoubleType, arrow::DoubleBuilder, arrow::DoubleArray)            \
   PROC(arrow::Date32Type, arrow::Date32Builder, arrow::Date32Array)            \
+  PROC(arrow::StringType, arrow::StringBuilder, arrow::StringArray)            \
   PROC(arrow::TimestampType, arrow::TimestampBuilder, arrow::TimestampArray)   \
   PROC(arrow::Decimal128Type, arrow::Decimal128Builder, arrow::Decimal128Array)
 
@@ -232,6 +233,13 @@ WindowAggregateFunctionKernel::createBuilder(std::shared_ptr<arrow::DataType> data_type) {
   return std::make_shared<BuilderType>(data_type, ctx_->memory_pool());
 }
 
+template <typename T>
+typename arrow::enable_if_string_like<
+    T, arrow::Result<std::shared_ptr<arrow::ArrayBuilder>>>
+WindowAggregateFunctionKernel::createBuilder(std::shared_ptr<arrow::DataType> data_type) {
+  return std::make_shared<arrow::StringBuilder>(data_type, ctx_->memory_pool());
+}
+
 WindowRankKernel::WindowRankKernel(
     arrow::compute::ExecContext* ctx,
     std::vector<std::shared_ptr<arrow::DataType>> type_list,
diff --git a/native-sql-engine/cpp/src/jni/jni_wrapper.cc b/native-sql-engine/cpp/src/jni/jni_wrapper.cc
index a000a8af3..f82068c37 100644
--- a/native-sql-engine/cpp/src/jni/jni_wrapper.cc
+++ b/native-sql-engine/cpp/src/jni/jni_wrapper.cc
@@ -1026,9 +1026,9 @@ JNIEXPORT jlong JNICALL
 Java_com_intel_oap_vectorized_ShuffleSplitterJniWrapper_nativeMake(
     JNIEnv* env, jobject, jstring partitioning_name_jstr, jint num_partitions,
     jbyteArray schema_arr, jbyteArray expr_arr, jlong offheap_per_task, jint buffer_size,
-    jstring compression_type_jstr, jstring data_file_jstr, jint num_sub_dirs,
-    jstring local_dirs_jstr, jboolean prefer_spill, jlong memory_pool_id,
-    jboolean write_schema) {
+    jstring compression_type_jstr, jint batch_compress_threshold, jstring data_file_jstr,
+    jint num_sub_dirs, jstring local_dirs_jstr, jboolean prefer_spill,
+    jlong memory_pool_id, jboolean write_schema) {
   JNI_METHOD_START
   if (partitioning_name_jstr == NULL) {
     JniThrow(std::string("Short partitioning name can't be null"));
@@ -1114,6 +1114,7 @@ Java_com_intel_oap_vectorized_ShuffleSplitterJniWrapper_nativeMake(
     jlong attmpt_id = env->CallLongMethod(tc_obj, get_tsk_attmpt_mid);
     splitOptions.task_attempt_id = (int64_t)attmpt_id;
   }
+  splitOptions.batch_compress_threshold = batch_compress_threshold;
 
   auto splitter = JniGetOrThrow(
       Splitter::Make(partitioning_name, std::move(schema), num_partitions,
diff --git a/native-sql-engine/cpp/src/precompile/gandiva.h b/native-sql-engine/cpp/src/precompile/gandiva.h
index 6d49c0056..d722f799d 100644
--- a/native-sql-engine/cpp/src/precompile/gandiva.h
+++ b/native-sql-engine/cpp/src/precompile/gandiva.h
@@ -21,8 +21,10 @@
 #include
 #include
 #include
+#include <re2/re2.h>
 #include
+#include <set>
 #include
 
 #include "third_party/gandiva/decimal_ops.h"
 
@@ -230,7 +232,8 @@ arrow::Decimal128 round(arrow::Decimal128 in, int32_t original_precision,
   return arrow::Decimal128(out);
 }
 
-std::string get_json_object(const std::string& json_str, const std::string& json_path) {
+std::string get_json_object(const std::string& json_str, const std::string& json_path,
+                            bool* validity) {
   std::unique_ptr<arrow::json::BlockParser> parser;
   (arrow::json::BlockParser::Make(arrow::json::ParseOptions::Defaults(), &parser));
   (parser->Parse(std::make_shared<arrow::Buffer>(json_str)));
@@ -239,18 +242,21 @@ std::string get_json_object(const std::string& json_str, const std::string& json
   auto struct_parsed = std::dynamic_pointer_cast<arrow::StructArray>(parsed);
   // json_path example: $.col_14, will extract col_14 here
   if (json_path.length() < 3) {
-    return nullptr;
+    *validity = false;
+    return "";
   }
   auto col_name = json_path.substr(2);
   // illegal json string.
   if (struct_parsed == nullptr) {
-    return nullptr;
+    *validity = false;
+    return "";
  }
   auto dict_parsed = std::dynamic_pointer_cast<arrow::DictionaryArray>(
       struct_parsed->GetFieldByName(col_name));
   // no data contained for given field.
   if (dict_parsed == nullptr) {
-    return nullptr;
+    *validity = false;
+    return "";
   }
 
   auto dict_array = dict_parsed->dictionary();
@@ -258,8 +264,54 @@ std::string get_json_object(const std::string& json_str, const std::string& json
 
   auto res_index = dict_parsed->GetValueIndex(0);
   // TODO(): check null results
   auto utf8_array = std::dynamic_pointer_cast<arrow::StringArray>(dict_array);
   auto res = utf8_array->GetString(res_index);
-
+  *validity = true;
   return res;
+}
+
+// Reused the code in gandiva LikeHolder.cc
+std::string SqlLikePatternToPcre(const std::string& sql_pattern, char escape_char) {
+  const std::set<char> pcre_regex_specials_ = {'[', ']', '(', ')', '|', '^', '-', '+',
+                                               '*', '?', '{', '}', '$', '\\', '.'};
+  /// Characters that are considered special by pcre regex. These needs to be
+  /// escaped with '\\'.
+  std::string pcre_pattern;
+  for (size_t idx = 0; idx < sql_pattern.size(); ++idx) {
+    auto cur = sql_pattern.at(idx);
+
+    // Escape any char that is special for pcre regex
+    if (pcre_regex_specials_.find(cur) != pcre_regex_specials_.end()) {
+      pcre_pattern += "\\";
+    }
+
+    if (cur == escape_char) {
+      // escape char must be followed by '_', '%' or the escape char itself.
+      ++idx;
+      if (idx == sql_pattern.size()) {
+        throw std::runtime_error("Unexpected escape char at the end of pattern " +
+                                 sql_pattern);
+      }
+      cur = sql_pattern.at(idx);
+      if (cur == '_' || cur == '%' || cur == escape_char) {
+        pcre_pattern += cur;
+      } else {
+        throw std::runtime_error("Invalid escape sequence in pattern " + sql_pattern);
+      }
+    } else if (cur == '_') {
+      pcre_pattern += '.';
+    } else if (cur == '%') {
+      pcre_pattern += ".*";
+    } else {
+      pcre_pattern += cur;
+    }
+  }
+  return pcre_pattern;
+}
+
+// Currently, escape char is not supported.
+bool like(const std::string& data, const std::string& pattern) {
+  std::string pcre_pattern = SqlLikePatternToPcre(pattern, 0);
+  RE2 regex(pcre_pattern);
+  return RE2::FullMatch(data, regex);
 }
\ No newline at end of file
diff --git a/native-sql-engine/cpp/src/shuffle/splitter.cc b/native-sql-engine/cpp/src/shuffle/splitter.cc
index 44f21567b..d58f0605d 100644
--- a/native-sql-engine/cpp/src/shuffle/splitter.cc
+++ b/native-sql-engine/cpp/src/shuffle/splitter.cc
@@ -361,15 +361,45 @@ arrow::Status Splitter::Init() {
                           arrow::Compression::UNCOMPRESSED));
   }
 
+  // initialize tiny batch write options
+  tiny_bach_write_options_ = ipc_write_options;
+  ARROW_ASSIGN_OR_RAISE(
+      tiny_bach_write_options_.codec,
+      arrow::util::Codec::Create(arrow::Compression::UNCOMPRESSED));
+
   return arrow::Status::OK();
 }
 
+int64_t batch_nbytes(const arrow::RecordBatch& batch) {
+  int64_t accumulated = 0L;
+  for (const auto& array : batch.columns()) {
+    if (array == nullptr || array->data() == nullptr) {
+      continue;
+    }
+    for (const auto& buf : array->data()->buffers) {
+      if (buf == nullptr) {
+        continue;
+      }
+      accumulated += buf->capacity();
+    }
+  }
+  return accumulated;
+}
+
+int64_t batch_nbytes(std::shared_ptr<arrow::RecordBatch> batch) {
+  if (batch == nullptr) {
+    return 0;
+  }
+  return batch_nbytes(*batch);
+}
+
 int64_t Splitter::CompressedSize(const arrow::RecordBatch& rb) {
   auto payload = std::make_shared<arrow::ipc::IpcPayload>();
-  auto result =
+  arrow::Status result;
+  result =
       arrow::ipc::GetRecordBatchPayload(rb, options_.ipc_write_options, payload.get());
   if (result.ok()) {
-    return payload.get()->body_length;
+    return payload->body_length;
   } else {
     result.UnknownError("Failed to get the compressed size.");
     return -1;
@@ -433,25 +463,6 @@ arrow::Status Splitter::Stop() {
   return arrow::Status::OK();
 }
 
-int64_t batch_nbytes(std::shared_ptr<arrow::RecordBatch> batch) {
-  int64_t accumulated = 0L;
-  if (batch == nullptr) {
-    return accumulated;
-  }
-  for (const auto& array : batch->columns()) {
-    if (array == nullptr || array->data() == nullptr) {
-      continue;
-    }
-    for (const auto& buf : array->data()->buffers) {
-      if (buf == nullptr) {
-        continue;
-      }
-      accumulated += buf->capacity();
-    }
-  }
-  return accumulated;
-}
-
 arrow::Status Splitter::CacheRecordBatch(int32_t partition_id, bool reset_buffers) {
   if (partition_buffer_idx_base_[partition_id] > 0) {
     auto fixed_width_idx = 0;
@@ -549,12 +560,18 @@ arrow::Status Splitter::CacheRecordBatch(int32_t partition_id, bool reset_buffer
       }
     }
     auto batch = arrow::RecordBatch::Make(schema_, num_rows, std::move(arrays));
-
+    int64_t raw_size = batch_nbytes(batch);
+    raw_partition_lengths_[partition_id] += raw_size;
     auto payload = std::make_shared<arrow::ipc::IpcPayload>();
-    TIME_NANO_OR_RAISE(total_compress_time_,
-                       arrow::ipc::GetRecordBatchPayload(
-                           *batch, options_.ipc_write_options, payload.get()));
-    raw_partition_lengths_[partition_id] += batch_nbytes(batch);
+    if (num_rows <= options_.batch_compress_threshold) {
+      TIME_NANO_OR_RAISE(total_compress_time_,
+                         arrow::ipc::GetRecordBatchPayload(
+                             *batch, tiny_bach_write_options_, payload.get()));
+    } else {
+      TIME_NANO_OR_RAISE(total_compress_time_,
+                         arrow::ipc::GetRecordBatchPayload(
+                             *batch, options_.ipc_write_options, payload.get()));
+    }
     partition_cached_recordbatch_size_[partition_id] += payload->body_length;
     partition_cached_recordbatch_[partition_id].push_back(std::move(payload));
     partition_buffer_idx_base_[partition_id] = 0;
diff --git a/native-sql-engine/cpp/src/shuffle/splitter.h b/native-sql-engine/cpp/src/shuffle/splitter.h
index 1bdd6aa50..dbf07aa87 100644
--- a/native-sql-engine/cpp/src/shuffle/splitter.h
+++ b/native-sql-engine/cpp/src/shuffle/splitter.h
@@ -209,6 +209,9 @@ class Splitter {
   std::shared_ptr<arrow::Schema> schema_;
   SplitOptions options_;
 
+  // write options for tiny batches
+  arrow::ipc::IpcWriteOptions tiny_bach_write_options_;
+
   int64_t total_bytes_written_ = 0;
   int64_t total_bytes_spilled_ = 0;
   int64_t total_write_time_ = 0;
diff --git a/native-sql-engine/cpp/src/shuffle/type.h b/native-sql-engine/cpp/src/shuffle/type.h
index f7d43ca69..e73974243 100644
--- a/native-sql-engine/cpp/src/shuffle/type.h
+++ b/native-sql-engine/cpp/src/shuffle/type.h
@@ -29,6 +29,7 @@ namespace shuffle {
 
 static constexpr int32_t kDefaultSplitterBufferSize = 4096;
 static constexpr int32_t kDefaultNumSubDirs = 64;
+static constexpr int32_t kDefaultBatchCompressThreshold = 256;
 
 // This 0xFFFFFFFF value is the first 4 bytes of a valid IPC message
 static constexpr int32_t kIpcContinuationToken = -1;
@@ -39,6 +40,7 @@ struct SplitOptions {
   int64_t offheap_per_task = 0;
   int32_t buffer_size = kDefaultSplitterBufferSize;
   int32_t num_sub_dirs = kDefaultNumSubDirs;
+  int32_t batch_compress_threshold = kDefaultBatchCompressThreshold;
   arrow::Compression::type compression_type = arrow::Compression::UNCOMPRESSED;
   bool prefer_spill = true;
   bool write_schema = true;
diff --git a/native-sql-engine/cpp/src/tests/arrow_compute_test_precompile.cc b/native-sql-engine/cpp/src/tests/arrow_compute_test_precompile.cc
index dbd996a8a..a596c9f3f 100644
--- a/native-sql-engine/cpp/src/tests/arrow_compute_test_precompile.cc
+++ b/native-sql-engine/cpp/src/tests/arrow_compute_test_precompile.cc
@@ -111,9 +111,33 @@ TEST(TestArrowCompute, ArithmeticComparisonTest) {
   ASSERT_EQ(res, true);
 }
 
+TEST(TestArrowCompute, LikeTest) {
+  std::string sql_pattern = "ab%";
+  EXPECT_TRUE(like("ab", sql_pattern));
+  EXPECT_TRUE(like("abc", sql_pattern));
+  EXPECT_TRUE(like("abcd", sql_pattern));
+  EXPECT_FALSE(like("a", sql_pattern));
+  EXPECT_FALSE(like("cab", sql_pattern));
+
+  sql_pattern = "%ab%";
+  EXPECT_TRUE(like("ab", sql_pattern));
+  EXPECT_TRUE(like("abcd", sql_pattern));
+  EXPECT_TRUE(like("cdab", sql_pattern));
+  EXPECT_TRUE(like("xxabxx", sql_pattern));
+}
+
 TEST(TestArrowCompute, JsonTest) {
-  std::string data = get_json_object(R"({"hello": "3.5"})", "$.hello");
+  bool validity;
+  std::string data = get_json_object(R"({"hello": "3.5"})", "$.hello", &validity);
   EXPECT_EQ(data, "3.5");
+  EXPECT_EQ(validity, true);
+
+  data = get_json_object(R"({"hello": ""})", "$.hello", &validity);
+  EXPECT_EQ(data, "");
+  EXPECT_EQ(validity, true);
+
+  data = get_json_object(R"({"hello": "3.5"})", "$.hi", &validity);
+  EXPECT_EQ(validity, false);
 }
 
 }  // namespace codegen
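
For readers following the shuffle hunks above: a record batch is serialized with a second,
uncompressed set of IPC write options whenever its row count is at or below
SplitOptions::batch_compress_threshold (default 256), so compression is skipped for tiny
payloads. Below is a minimal standalone sketch of that decision; it is not code from this
patch, MakeShufflePayload is a hypothetical helper name, and the arrow::ipc::IpcPayload /
arrow::ipc::GetRecordBatchPayload spellings follow the hunks above (the project builds
against its own Arrow branch; adjust namespaces if your Arrow build differs).

// Sketch only: mirrors the row-count threshold added to Splitter::CacheRecordBatch.
// MakeShufflePayload is a hypothetical helper, not part of the gazelle code base.
#include <arrow/ipc/writer.h>
#include <arrow/record_batch.h>
#include <arrow/result.h>
#include <arrow/util/compression.h>

arrow::Status MakeShufflePayload(const arrow::RecordBatch& batch,
                                 int32_t batch_compress_threshold,
                                 const arrow::ipc::IpcWriteOptions& compressed_options,
                                 arrow::ipc::IpcPayload* out) {
  // Copy the configured options and drop the codec, as Splitter::Init() does for
  // its tiny-batch write options.
  arrow::ipc::IpcWriteOptions tiny_batch_options = compressed_options;
  ARROW_ASSIGN_OR_RAISE(tiny_batch_options.codec,
                        arrow::util::Codec::Create(arrow::Compression::UNCOMPRESSED));
  // Batches at or below the row-count threshold skip compression entirely.
  const auto& options = batch.num_rows() <= batch_compress_threshold
                            ? tiny_batch_options
                            : compressed_options;
  return arrow::ipc::GetRecordBatchPayload(batch, options, out);
}

The threshold itself is plumbed in from the JVM side through
ShuffleSplitterJniWrapper.nativeMake (see the jni_wrapper.cc hunk), so the 256-row default
from shuffle/type.h can be overridden by configuration rather than being hard-coded.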