From cfbafebb551fdaecbc522647f0763572959fe52a Mon Sep 17 00:00:00 2001 From: lgbo Date: Tue, 3 Sep 2024 19:54:08 +0800 Subject: [PATCH] have_compressed is lost in HashJoin::reuseJoinedData (#7083) --- .../execution/GlutenClickHouseTPCHSuite.scala | 16 ++++++++++++++++ cpp-ch/clickhouse.version | 2 +- 2 files changed, 17 insertions(+), 1 deletion(-) diff --git a/backends-clickhouse/src/test/scala/org/apache/gluten/execution/GlutenClickHouseTPCHSuite.scala b/backends-clickhouse/src/test/scala/org/apache/gluten/execution/GlutenClickHouseTPCHSuite.scala index 93c13d15c6ce..c517afcb2905 100644 --- a/backends-clickhouse/src/test/scala/org/apache/gluten/execution/GlutenClickHouseTPCHSuite.scala +++ b/backends-clickhouse/src/test/scala/org/apache/gluten/execution/GlutenClickHouseTPCHSuite.scala @@ -531,5 +531,21 @@ class GlutenClickHouseTPCHSuite extends GlutenClickHouseTPCHAbstractSuite { spark.sql("drop table t1") spark.sql("drop table t2") } + + /* Regression test added with this patch: creates parquet table cross_join_t (a bigint, b string, c string), fills it with 100000 rows generated from range(0, 100000), runs a full join of the table with itself that has no join condition (limit 10), passes that query to compareResultsAgainstVanillaSpark, and finally drops the table. NOTE(review): the drop is not in a finally block, so the table presumably stays behind if the comparison throws - confirm whether suite teardown cleans it up. */ test("gluten-7077 bug in cross broad cast join") { + spark.sql("create table cross_join_t(a bigint, b string, c string) using parquet"); + var sql = """ + | insert into cross_join_t + | select id as a, cast(id as string) as b, + | concat('1231231232323232322', cast(id as string)) as c + | from range(0, 100000) + |""".stripMargin + spark.sql(sql) + sql = """ + | select * from cross_join_t as t1 full join cross_join_t as t2 limit 10 + |""".stripMargin + compareResultsAgainstVanillaSpark(sql, true, { _ => }) + spark.sql("drop table cross_join_t") + } } // scalastyle:off line.size.limit diff --git a/cpp-ch/clickhouse.version b/cpp-ch/clickhouse.version index 486c96a540e3..8859c650a85c 100644 --- a/cpp-ch/clickhouse.version +++ b/cpp-ch/clickhouse.version @@ -1,3 +1,3 @@ CH_ORG=Kyligence CH_BRANCH=rebase_ch/20240830 -CH_COMMIT=fc5f00d8cb7 \ No newline at end of file +CH_COMMIT=d239aeff645