From 9eeecad4aaea5f555d3c1d8441e312ae9eda7326 Mon Sep 17 00:00:00 2001 From: Allen Xu Date: Thu, 8 Apr 2021 00:30:21 +0800 Subject: [PATCH] Enable orc write (#2084) Re-enable the orc write since https://github.com/NVIDIA/spark-rapids/issues/1550 has been fixed Signed-off-by: Allen Xu --- docs/configs.md | 2 +- .../src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala | 5 ++--- 2 files changed, 3 insertions(+), 4 deletions(-) diff --git a/docs/configs.md b/docs/configs.md index a65ca2db758..7e0b3ae758b 100644 --- a/docs/configs.md +++ b/docs/configs.md @@ -68,7 +68,7 @@ Name | Description | Default Value spark.rapids.sql.format.csv.read.enabled|When set to false disables csv input acceleration|true spark.rapids.sql.format.orc.enabled|When set to false disables all orc input and output acceleration|true spark.rapids.sql.format.orc.read.enabled|When set to false disables orc input acceleration|true -spark.rapids.sql.format.orc.write.enabled|When set to false disables orc output acceleration. This has been disabled by default because of https://github.com/NVIDIA/spark-rapids/issues/1550|false +spark.rapids.sql.format.orc.write.enabled|When set to false disables orc output acceleration|true spark.rapids.sql.format.parquet.enabled|When set to false disables all parquet input and output acceleration|true spark.rapids.sql.format.parquet.multiThreadedRead.maxNumFilesParallel|A limit on the maximum number of files per task processed in parallel on the CPU side before the file is sent to the GPU. This affects the amount of host memory used when reading the files in parallel. Used with MULTITHREADED reader, see spark.rapids.sql.format.parquet.reader.type|2147483647 spark.rapids.sql.format.parquet.multiThreadedRead.numThreads|The maximum number of threads, on the executor, to use for reading small parquet files in parallel. This can not be changed at runtime after the executor has started. Used with COALESCING and MULTITHREADED reader, see spark.rapids.sql.format.parquet.reader.type.|20 diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala index 9a2392a2bdb..753dc8c4185 100644 --- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala +++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala @@ -701,10 +701,9 @@ object RapidsConf { .createWithDefault(true) val ENABLE_ORC_WRITE = conf("spark.rapids.sql.format.orc.write.enabled") - .doc("When set to false disables orc output acceleration. This has been disabled by " + - "default because of https://github.com/NVIDIA/spark-rapids/issues/1550") + .doc("When set to false disables orc output acceleration") .booleanConf - .createWithDefault(false) + .createWithDefault(true) val ENABLE_CSV = conf("spark.rapids.sql.format.csv.enabled") .doc("When set to false disables all csv input and output acceleration. " +