fix ut

apache · Aug 26, 2024 · f0848ad · f0848ad
1 parent 6815f08
commit f0848ad
Show file tree

Hide file tree

Showing 17 changed files with 366 additions and 284 deletions.
diff --git a/backends-clickhouse/src/main/scala/org/apache/gluten/backendsapi/clickhouse/CHBackend.scala b/backends-clickhouse/src/main/scala/org/apache/gluten/backendsapi/clickhouse/CHBackend.scala
@@ -405,4 +405,6 @@ object CHBackendSettings extends BackendSettingsApi with Logging {
         }
       }
   }
+
+  override def supportNativeInputFileRelatedExpr(): Boolean = true
 }
diff --git a/...ds-clickhouse/src/main/scala/org/apache/gluten/backendsapi/clickhouse/CHIteratorApi.scala b/...ds-clickhouse/src/main/scala/org/apache/gluten/backendsapi/clickhouse/CHIteratorApi.scala
@@ -33,6 +33,7 @@ import org.apache.spark.{InterruptibleIterator, SparkConf, TaskContext}
 import org.apache.spark.affinity.CHAffinity
 import org.apache.spark.executor.InputMetrics
 import org.apache.spark.internal.Logging
+import org.apache.spark.shuffle.CHColumnarShuffleWriter
 import org.apache.spark.sql.connector.read.InputPartition
 import org.apache.spark.sql.execution.datasources.FilePartition
 import org.apache.spark.sql.execution.metric.SQLMetric
@@ -322,8 +323,10 @@ class CollectMetricIterator(
   private var outputRowCount = 0L
   private var outputVectorCount = 0L
   private var metricsUpdated = false
+  private var wholeStagePipeline = true
 
   override def hasNext: Boolean = {
+    wholeStagePipeline = false
     nativeIterator.hasNext
   }
 
@@ -347,6 +350,11 @@ class CollectMetricIterator(
   private def collectStageMetrics(): Unit = {
     if (!metricsUpdated) {
       val nativeMetrics = nativeIterator.getMetrics.asInstanceOf[NativeMetrics]
+      if (wholeStagePipeline) {
+        outputRowCount = Math.max(outputRowCount, CHColumnarShuffleWriter.getTotalOutputRows())
+        outputVectorCount =
+          Math.max(outputVectorCount, CHColumnarShuffleWriter.getTotalOutputBatches())
+      }
       nativeMetrics.setFinalOutputMetrics(outputRowCount, outputVectorCount)
       updateNativeMetrics(nativeMetrics)
       updateInputMetrics.foreach(_(inputMetrics))

diff --git a/backends-clickhouse/src/main/scala/org/apache/spark/shuffle/CHColumnarShuffleWriter.scala b/backends-clickhouse/src/main/scala/org/apache/spark/shuffle/CHColumnarShuffleWriter.scala
@@ -22,7 +22,7 @@ import org.apache.gluten.execution.ColumnarNativeIterator
 import org.apache.gluten.memory.CHThreadGroup
 import org.apache.gluten.vectorized._
 
-import org.apache.spark.SparkEnv
+import org.apache.spark.{SparkEnv, TaskContext}
 import org.apache.spark.internal.Logging
 import org.apache.spark.scheduler.MapStatus
 import org.apache.spark.sql.vectorized.ColumnarBatch
@@ -134,7 +134,7 @@ class CHColumnarShuffleWriter[K, V](
       writeMetrics.incWriteTime(splitResult.getTotalWriteTime + splitResult.getTotalSpillTime)
       partitionLengths = splitResult.getPartitionLengths
       rawPartitionLengths = splitResult.getRawPartitionLengths
-
+      CHColumnarShuffleWriter.setOutputMetrics(splitResult)
       try {
         shuffleBlockResolver.writeMetadataFileAndCommit(
           dep.shuffleId,
@@ -188,3 +188,30 @@ class CHColumnarShuffleWriter[K, V](
   def getPartitionLengths(): Array[Long] = partitionLengths
 
 }
+
+object CHColumnarShuffleWriter {
+  def setOutputMetrics(splitResult: CHSplitResult): Unit = {
+    TaskContext
+      .get()
+      .getLocalProperties
+      .setProperty("total_output_rows", splitResult.getTotalRows.toString)
+    TaskContext
+      .get()
+      .getLocalProperties
+      .setProperty("total_output_batches", splitResult.getTotalBatches.toString)
+  }
+
+  def getTotalOutputRows(): Long = {
+    val output_rows = TaskContext.get().getLocalProperty("total_output_rows")
+    var output_rows_value = 0L
+    if (output_rows != null && output_rows.nonEmpty) output_rows_value = output_rows.toLong
+    output_rows_value
+  }
+
+  def getTotalOutputBatches(): Long = {
+    val output_batches = TaskContext.get().getLocalProperty("total_output_batches")
+    var output_batches_value = 0L
+    if (output_batches != null) output_batches_value = output_batches.toLong
+    output_batches_value
+  }
+}
diff --git a/...src/test/scala/org/apache/gluten/execution/metrics/GlutenClickHouseTPCHMetricsSuite.scala b/...src/test/scala/org/apache/gluten/execution/metrics/GlutenClickHouseTPCHMetricsSuite.scala
@@ -103,8 +103,8 @@ class GlutenClickHouseTPCHMetricsSuite extends GlutenClickHouseTPCHAbstractSuite
           case scanExec: BasicScanExecTransformer => scanExec
         }
         assert(plans.size == 1)
-        // 1 block keep in SubstraitFileStep, and 4 blocks keep in other steps
-        assert(plans.head.metrics("numOutputRows").value === 5 * parquetMaxBlockSize)
+        // 1 block keep in SubstraitFileStep, and 5 blocks keep in other steps
+        assert(plans.head.metrics("numOutputRows").value === 6 * parquetMaxBlockSize)
         assert(plans.head.metrics("outputVectors").value === 1)
         assert(plans.head.metrics("outputBytes").value > 0)
     }

diff --git a/cpp-ch/local-engine/Common/common.cpp b/cpp-ch/local-engine/Common/common.cpp
diff --git a/cpp-ch/local-engine/Parser/LocalExecutor.cpp b/cpp-ch/local-engine/Parser/LocalExecutor.cpp
@@ -0,0 +1,186 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include "LocalExecutor.h"
+
+#include <Common/QueryContext.h>
+#include <QueryPipeline/printPipeline.h>
+#include <Processors/Executors/PipelineExecutor.h>
+#include <Core/Settings.h>
+
+#include "SerializedPlanParser.h"
+
+using namespace DB;
+namespace local_engine
+{
+
+LocalExecutor::~LocalExecutor()
+{
+    if (dump_pipeline)
+        LOG_INFO(&Poco::Logger::get("LocalExecutor"), "Dump pipeline:\n{}", dumpPipeline());
+
+    if (spark_buffer)
+    {
+        ch_column_to_spark_row->freeMem(spark_buffer->address, spark_buffer->size);
+        spark_buffer.reset();
+    }
+}
+
+std::unique_ptr<SparkRowInfo> LocalExecutor::writeBlockToSparkRow(const Block & block) const
+{
+    return ch_column_to_spark_row->convertCHColumnToSparkRow(block);
+}
+
+void LocalExecutor::initPullingPipelineExecutor()
+{
+    if (!executor)
+    {
+        query_pipeline = QueryPipelineBuilder::getPipeline(std::move(*query_pipeline_builder));
+        query_pipeline.setNumThreads(1);
+        executor = std::make_unique<PullingAsyncPipelineExecutor>(query_pipeline);
+    }
+}
+
+bool LocalExecutor::hasNext()
+{
+    initPullingPipelineExecutor();
+    size_t columns = currentBlock().columns();
+    if (columns == 0 || isConsumed())
+    {
+        auto empty_block = header.cloneEmpty();
+        setCurrentBlock(empty_block);
+        bool has_next = executor->pull(currentBlock());
+        produce();
+        return has_next;
+    }
+    return true;
+}
+
+bool LocalExecutor::fallbackMode()
+{
+    if (executor.get() || fallback_mode)
+        std::cerr << fmt::format("executor {} in fallback mode\n", reinterpret_cast<long>(this));
+    else
+        std::cerr << fmt::format("executor {} not in fallback mode\n", reinterpret_cast<long>(this));
+    return executor.get() || fallback_mode;
+}
+
+SparkRowInfoPtr LocalExecutor::next()
+{
+    checkNextValid();
+    SparkRowInfoPtr row_info = writeBlockToSparkRow(currentBlock());
+    consume();
+    if (spark_buffer)
+    {
+        ch_column_to_spark_row->freeMem(spark_buffer->address, spark_buffer->size);
+        spark_buffer.reset();
+    }
+    spark_buffer = std::make_unique<SparkBuffer>();
+    spark_buffer->address = row_info->getBufferAddress();
+    spark_buffer->size = row_info->getTotalBytes();
+    std::cerr << "call next\n";
+    return row_info;
+}
+Block * LocalExecutor::nextColumnar()
+{
+    checkNextValid();
+    Block * columnar_batch;
+    if (currentBlock().columns() > 0)
+    {
+        columnar_batch = &currentBlock();
+    }
+    else
+    {
+        auto empty_block = header.cloneEmpty();
+        setCurrentBlock(empty_block);
+        columnar_batch = &currentBlock();
+    }
+    consume();
+    return columnar_batch;
+}
+
+void LocalExecutor::cancel()
+{
+    if (executor)
+        executor->cancel();
+    if (push_executor)
+        push_executor->cancel();
+}
+
+void LocalExecutor::setSinks(std::function<void(DB::QueryPipelineBuilder &)> setter)
+{
+    setter(*query_pipeline_builder);
+}
+
+void LocalExecutor::setExternalPipelineBuilder(DB::QueryPipelineBuilderPtr builder)
+{
+    external_pipeline_builder = std::move(builder);
+}
+
+void LocalExecutor::execute()
+{
+    chassert(query_pipeline_builder || external_pipeline_builder);
+    if (external_pipeline_builder)
+        push_executor = external_pipeline_builder->execute();
+    else
+        push_executor = query_pipeline_builder->execute();
+    push_executor->execute(local_engine::QueryContextManager::instance().currentQueryContext()->getSettingsRef().max_threads, false);
+}
+
+Block LocalExecutor::getHeader()
+{
+    return header;
+}
+
+LocalExecutor::LocalExecutor(QueryPlanPtr query_plan, QueryPipelineBuilderPtr pipeline_builder, bool dump_pipeline_)
+    : query_pipeline_builder(std::move(pipeline_builder))
+    , header(query_plan->getCurrentDataStream().header.cloneEmpty())
+    , dump_pipeline(dump_pipeline_)
+    , ch_column_to_spark_row(std::make_unique<CHColumnToSparkRow>())
+    , current_query_plan(std::move(query_plan))
+{
+    if (current_executor)
+    {
+        fallback_mode = true;
+    }
+    // only need record last executor
+    current_executor = this;
+}
+thread_local LocalExecutor * LocalExecutor::current_executor = nullptr;
+std::string LocalExecutor::dumpPipeline() const
+{
+    const auto & processors = query_pipeline.getProcessors();
+    for (auto & processor : processors)
+    {
+        WriteBufferFromOwnString buffer;
+        auto data_stats = processor->getProcessorDataStats();
+        buffer << "(";
+        buffer << "\nexecution time: " << processor->getElapsedNs() / 1000U << " us.";
+        buffer << "\ninput wait time: " << processor->getInputWaitElapsedNs() / 1000U << " us.";
+        buffer << "\noutput wait time: " << processor->getOutputWaitElapsedNs() / 1000U << " us.";
+        buffer << "\ninput rows: " << data_stats.input_rows;
+        buffer << "\ninput bytes: " << data_stats.input_bytes;
+        buffer << "\noutput rows: " << data_stats.output_rows;
+        buffer << "\noutput bytes: " << data_stats.output_bytes;
+        buffer << ")";
+        processor->setDescription(buffer.str());
+    }
+    WriteBufferFromOwnString out;
+    DB::printPipeline(processors, out);
+    return out.str();
+}
+}
-Original file line number
+Diff line change
@@ Expand Up @@
             }
           }
       }
+      override def supportNativeInputFileRelatedExpr(): Boolean = true
     }