Skip to content

Commit 80b2166

Browse files
committed
Add comment on null-filtering semantics
1 parent 37c4539 commit 80b2166

File tree

1 file changed

+2
-0
lines changed
  • sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/aggregate

1 file changed

+2
-0
lines changed

sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/aggregate/collect.scala

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -65,6 +65,8 @@ abstract class Collect extends ImperativeAggregate {
6565
}
6666

6767
override def update(b: MutableRow, input: InternalRow): Unit = {
68+
// Do not allow null values. We follow the semantics of Hive's collect_list/collect_set here.
69+
// See: org.apache.hadoop.hive.ql.udf.generic.GenericUDAFMkCollectionEvaluator
6870
val value = child.eval(input)
6971
if (value != null) {
7072
buffer += value

0 commit comments

Comments
 (0)