Commit 9cc98f5

Move more code to Java; fix bugs in UnsafeRowConverter length type.

The length type is an int, not a long, but the code was inconsistent about this. I also now use byte arrays instead of long arrays in some places in order to avoid off-by-a-factor-of-8 errors.
1 parent: c8792de
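The off-by-a-factor-of-8 hazard mentioned above comes from computing sizes in bytes while storing rows in a `long[]`, so every capacity check and fill bound has to be divided by 8. A minimal sketch of the two conventions, with illustrative buffer names (not code from this commit):

```java
import java.util.Arrays;

// Illustrative only: why byte[] buffers avoid the "/ 8" bookkeeping that long[] buffers need.
public final class LengthUnitsSketch {
  public static void main(String[] args) {
    final int sizeInBytes = 40;  // row sizes are always computed in bytes

    // long[]-backed buffer: every bound must be converted from bytes to 8-byte words.
    long[] longBuffer = new long[1024];
    if (sizeInBytes / 8 > longBuffer.length) {
      longBuffer = new long[sizeInBytes / 8];  // forgetting a "/ 8" here allocates 8x too much
    }
    Arrays.fill(longBuffer, 0, sizeInBytes / 8, 0L);

    // byte[]-backed buffer: sizes and indices share one unit, so there is nothing to forget.
    byte[] byteBuffer = new byte[1024];
    if (sizeInBytes > byteBuffer.length) {
      byteBuffer = new byte[sizeInBytes];
    }
    Arrays.fill(byteBuffer, 0, sizeInBytes, (byte) 0);
    System.out.println("zeroed " + sizeInBytes + " bytes in both buffers");
  }
}
```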

4 files changed: +186 -84 lines changed

core/src/main/java/org/apache/spark/util/collection/unsafe/sort/UnsafeExternalSorter.java

Lines changed: 4 additions & 4 deletions
```diff
@@ -151,7 +151,7 @@ public long freeMemory() {
     return memoryFreed;
   }
 
-  private void ensureSpaceInDataPage(int requiredSpace) throws Exception {
+  private void ensureSpaceInDataPage(int requiredSpace) throws IOException {
     // TODO: merge these steps to first calculate total memory requirements for this insert,
     // then try to acquire; no point in acquiring sort buffer only to spill due to no space in the
     // data page.
@@ -176,7 +176,7 @@ private void ensureSpaceInDataPage(int requiredSpace) throws Exception {
     }
     if (requiredSpace > PAGE_SIZE) {
       // TODO: throw a more specific exception?
-      throw new Exception("Required space " + requiredSpace + " is greater than page size (" +
+      throw new IOException("Required space " + requiredSpace + " is greater than page size (" +
         PAGE_SIZE + ")");
     } else if (requiredSpace > spaceInCurrentPage) {
       if (spillingEnabled) {
@@ -187,7 +187,7 @@ private void ensureSpaceInDataPage(int requiredSpace) throws Exception {
         final long memoryAcquiredAfterSpill = shuffleMemoryManager.tryToAcquire(PAGE_SIZE);
         if (memoryAcquiredAfterSpill != PAGE_SIZE) {
           shuffleMemoryManager.release(memoryAcquiredAfterSpill);
-          throw new Exception("Can't allocate memory!");
+          throw new IOException("Can't allocate memory!");
         }
       }
     }
@@ -202,7 +202,7 @@ public void insertRecord(
       Object recordBaseObject,
       long recordBaseOffset,
       int lengthInBytes,
-      long prefix) throws Exception {
+      long prefix) throws IOException {
     // Need 4 bytes to store the record length.
     ensureSpaceInDataPage(lengthInBytes + 4);
 
```
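A side note on the `ensureSpaceInDataPage(lengthInBytes + 4)` call above: each record is stored in the data page as a 4-byte int length header followed by the payload, which is also why the record length fixed by this commit is an int rather than a long. A hedged sketch of that layout using a plain ByteBuffer (illustrative; the sorter writes through PlatformDependent, not ByteBuffer):

```java
import java.nio.ByteBuffer;

// Illustrative sketch of the record layout implied by "lengthInBytes + 4":
// [ int length (4 bytes) | record payload (length bytes) ]
final class RecordLayoutSketch {
  static void writeRecord(ByteBuffer page, byte[] record) {
    page.putInt(record.length);  // 4-byte int length header, hence the int (not long) length type
    page.put(record);            // payload follows immediately
  }

  static byte[] readRecord(ByteBuffer page) {
    final int length = page.getInt();  // read the 4-byte header first
    final byte[] record = new byte[length];
    page.get(record);
    return record;
  }

  public static void main(String[] args) {
    final ByteBuffer page = ByteBuffer.allocate(64);
    writeRecord(page, "hello".getBytes());
    page.flip();
    System.out.println(new String(readRecord(page)));  // prints "hello"
  }
}
```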

sql/catalyst/src/main/java/org/apache/spark/sql/catalyst/expressions/UnsafeRow.java

Lines changed: 7 additions & 0 deletions
```diff
@@ -17,6 +17,11 @@
 
 package org.apache.spark.sql.catalyst.expressions;
 
+import java.math.BigDecimal;
+import java.sql.Date;
+import java.util.*;
+import javax.annotation.Nullable;
+
 import org.apache.spark.sql.catalyst.InternalRow;
 import org.apache.spark.sql.catalyst.util.ObjectPool;
 import org.apache.spark.unsafe.PlatformDependent;
@@ -55,6 +60,8 @@
  */
 public final class UnsafeRow extends MutableRow {
 
+  /** Hack for if we want to pass around an UnsafeRow which also carries around its backing data */
+  @Nullable public byte[] backingArray;
   private Object baseObject;
   private long baseOffset;
```
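Why `backingArray` helps: an UnsafeRow is normally just a pointer into memory owned by something else (a sorter page, for example), so it becomes invalid the moment that memory is freed or overwritten. Holding a strong reference to a copied byte[] ties the row's lifetime to its data. A simplified sketch of the pattern, with `PointerRow` standing in for the real UnsafeRow:

```java
import java.util.Arrays;

// Simplified stand-in for UnsafeRow: a row that merely points at externally owned memory.
final class PointerRow {
  private Object baseObject;   // whoever owns this memory controls the row's validity
  private long baseOffset;
  byte[] backingArray;         // optional strong reference that keeps the data alive

  void pointTo(Object baseObject, long baseOffset) {
    this.baseObject = baseObject;
    this.baseOffset = baseOffset;
  }
}

final class BackingArrayDemo {
  public static void main(String[] args) {
    byte[] sorterPage = new byte[]{1, 2, 3, 4};  // pretend this is sorter-owned memory
    PointerRow row = new PointerRow();

    // Copy the record out of the page, then point the row at the copy and pin it:
    byte[] copy = Arrays.copyOf(sorterPage, sorterPage.length);
    row.backingArray = copy;   // the row now carries its own data
    row.pointTo(copy, 0L);

    sorterPage = null;         // the sorter can free its page; the row stays valid
    System.out.println(row.backingArray.length);  // prints 4
  }
}
```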

org/apache/spark/sql/execution/UnsafeExternalRowSorter.java (new file)

Lines changed: 171 additions & 0 deletions
```diff
@@ -0,0 +1,171 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.execution;
+
+import java.io.IOException;
+import java.util.Arrays;
+
+import scala.Function1;
+import scala.collection.AbstractIterator;
+import scala.collection.Iterator;
+import scala.math.Ordering;
+
+import org.apache.spark.SparkEnv;
+import org.apache.spark.TaskContext;
+import org.apache.spark.sql.Row;
+import org.apache.spark.sql.catalyst.expressions.UnsafeRow;
+import org.apache.spark.sql.catalyst.expressions.UnsafeRowConverter;
+import org.apache.spark.sql.types.StructType;
+import org.apache.spark.unsafe.PlatformDependent;
+import org.apache.spark.util.collection.unsafe.sort.PrefixComparator;
+import org.apache.spark.util.collection.unsafe.sort.RecordComparator;
+import org.apache.spark.util.collection.unsafe.sort.UnsafeExternalSorter;
+import org.apache.spark.util.collection.unsafe.sort.UnsafeSorterIterator;
+
+final class UnsafeExternalRowSorter {
+
+  private final StructType schema;
+  private final UnsafeRowConverter rowConverter;
+  private final RowComparator rowComparator;
+  private final PrefixComparator prefixComparator;
+  private final Function1<Row, Long> prefixComputer;
+
+  public UnsafeExternalRowSorter(
+      StructType schema,
+      Ordering<Row> ordering,
+      PrefixComparator prefixComparator,
+      // TODO: if possible, avoid this boxing of the return value
+      Function1<Row, Long> prefixComputer) {
+    this.schema = schema;
+    this.rowConverter = new UnsafeRowConverter(schema);
+    this.rowComparator = new RowComparator(ordering, schema);
+    this.prefixComparator = prefixComparator;
+    this.prefixComputer = prefixComputer;
+  }
+
+  public Iterator<Row> sort(Iterator<Row> inputIterator) throws IOException {
+    final SparkEnv sparkEnv = SparkEnv.get();
+    final TaskContext taskContext = TaskContext.get();
+    byte[] rowConversionBuffer = new byte[1024 * 8];
+    final UnsafeExternalSorter sorter = new UnsafeExternalSorter(
+      taskContext.taskMemoryManager(),
+      sparkEnv.shuffleMemoryManager(),
+      sparkEnv.blockManager(),
+      taskContext,
+      rowComparator,
+      prefixComparator,
+      4096,
+      sparkEnv.conf()
+    );
+    try {
+      while (inputIterator.hasNext()) {
+        final Row row = inputIterator.next();
+        final int sizeRequirement = rowConverter.getSizeRequirement(row);
+        if (sizeRequirement > rowConversionBuffer.length) {
+          rowConversionBuffer = new byte[sizeRequirement];
+        } else {
+          // Zero out the buffer that's used to hold the current row. This is necessary in order
+          // to ensure that rows hash properly, since garbage data from the previous row could
+          // otherwise end up as padding in this row. As a performance optimization, we only zero
+          // out the portion of the buffer that we'll actually write to.
+          Arrays.fill(rowConversionBuffer, 0, sizeRequirement, (byte) 0);
+        }
+        final int bytesWritten =
+          rowConverter.writeRow(row, rowConversionBuffer, PlatformDependent.BYTE_ARRAY_OFFSET);
+        assert (bytesWritten == sizeRequirement);
+        final long prefix = prefixComputer.apply(row);
+        sorter.insertRecord(
+          rowConversionBuffer,
+          PlatformDependent.BYTE_ARRAY_OFFSET,
+          sizeRequirement,
+          prefix
+        );
+      }
+      final UnsafeSorterIterator sortedIterator = sorter.getSortedIterator();
+      return new AbstractIterator<Row>() {
+
+        private final int numFields = schema.length();
+        private final UnsafeRow row = new UnsafeRow();
+
+        @Override
+        public boolean hasNext() {
+          return sortedIterator.hasNext();
+        }
+
+        @Override
+        public Row next() {
+          try {
+            sortedIterator.loadNext();
+            if (hasNext()) {
+              row.pointTo(
+                sortedIterator.getBaseObject(), sortedIterator.getBaseOffset(), numFields, schema);
+              return row;
+            } else {
+              final byte[] rowDataCopy = new byte[sortedIterator.getRecordLength()];
+              PlatformDependent.copyMemory(
+                sortedIterator.getBaseObject(),
+                sortedIterator.getBaseOffset(),
+                rowDataCopy,
+                PlatformDependent.BYTE_ARRAY_OFFSET,
+                sortedIterator.getRecordLength()
+              );
+              row.backingArray = rowDataCopy;
+              row.pointTo(rowDataCopy, PlatformDependent.BYTE_ARRAY_OFFSET, numFields, schema);
+              sorter.freeMemory();
+              return row;
+            }
+          } catch (IOException e) {
+            // TODO: we need to ensure that files are cleaned properly after an exception,
+            // so we need better cleanup methods than freeMemory().
+            sorter.freeMemory();
+            // Scala iterators don't declare any checked exceptions, so we need to use this hack
+            // to re-throw the exception:
+            PlatformDependent.throwException(e);
+          }
+          throw new RuntimeException("Exception should have been re-thrown in next()");
+        };
+      };
+    } catch (IOException e) {
+      // TODO: we need to ensure that files are cleaned properly after an exception,
+      // so we need better cleanup methods than freeMemory().
+      sorter.freeMemory();
+      throw e;
+    }
+  }
+
+  private static final class RowComparator extends RecordComparator {
+    private final StructType schema;
+    private final Ordering<Row> ordering;
+    private final int numFields;
+    private final UnsafeRow row1 = new UnsafeRow();
+    private final UnsafeRow row2 = new UnsafeRow();
+
+    public RowComparator(Ordering<Row> ordering, StructType schema) {
+      this.schema = schema;
+      this.numFields = schema.length();
+      this.ordering = ordering;
+    }
+
+    @Override
+    public int compare(Object baseObj1, long baseOff1, Object baseObj2, long baseOff2) {
+      row1.pointTo(baseObj1, baseOff1, numFields, schema);
+      row2.pointTo(baseObj2, baseOff2, numFields, schema);
+      return ordering.compare(row1, row2);
+    }
+  }
+}
```
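The `PlatformDependent.throwException(e)` call in `next()` exists because Scala's `Iterator.next()` declares no checked exceptions, so the Java implementation cannot rethrow the `IOException` directly. Such helpers are commonly built on the generics-based "sneaky throw" trick sketched below; this shows the general technique, not necessarily PlatformDependent's exact implementation:

```java
// Sketch of the "sneaky throw" technique: rethrow a checked exception from a method
// whose signature does not declare it. Illustrative only.
final class SneakyThrowSketch {
  @SuppressWarnings("unchecked")
  private static <T extends Throwable> void sneakyThrow(Throwable t) throws T {
    // The cast is erased at runtime, so the compiler treats the checked
    // exception as the freely chosen type parameter T.
    throw (T) t;
  }

  public static void throwException(Throwable t) {
    // Instantiating T as RuntimeException removes the checked "throws" obligation.
    SneakyThrowSketch.<RuntimeException>sneakyThrow(t);
  }

  public static void main(String[] args) {
    try {
      throwException(new java.io.IOException("checked, but rethrown unchecked"));
    } catch (Exception e) {
      System.out.println("caught again: " + e);  // prints the original IOException
    }
  }
}
```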

sql/core/src/main/scala/org/apache/spark/sql/execution/basicOperators.scala

Lines changed: 4 additions & 80 deletions
```diff
@@ -17,12 +17,9 @@
 
 package org.apache.spark.sql.execution
 
-import java.util.Arrays
-
 import org.apache.spark.sql.types.StructType
-import org.apache.spark.unsafe.PlatformDependent
-import org.apache.spark.util.collection.unsafe.sort.{RecordComparator, PrefixComparator, UnsafeExternalSorter}
-import org.apache.spark.{TaskContext, SparkEnv, HashPartitioner, SparkConf}
+import org.apache.spark.util.collection.unsafe.sort.PrefixComparator
+import org.apache.spark.{SparkEnv, HashPartitioner}
 import org.apache.spark.annotation.DeveloperApi
 import org.apache.spark.rdd.{RDD, ShuffledRDD}
 import org.apache.spark.shuffle.sort.SortShuffleManager
@@ -272,87 +269,14 @@ case class UnsafeExternalSort(
     if (global) OrderedDistribution(sortOrder) :: Nil else UnspecifiedDistribution :: Nil
 
   protected override def doExecute(): RDD[Row] = attachTree(this, "sort") {
-    // TODO(josh): This code is unreadably messy; this should be split into a separate file
-    // and written in Java.
     assert (codegenEnabled)
     def doSort(iterator: Iterator[Row]): Iterator[Row] = {
       val ordering = newOrdering(sortOrder, child.output)
-      val rowConverter = new UnsafeRowConverter(schema.map(_.dataType).toArray)
-      var rowConversionScratchSpace = new Array[Long](1024)
       val prefixComparator = new PrefixComparator {
        override def compare(prefix1: Long, prefix2: Long): Int = 0
      }
-      val recordComparator = new RecordComparator {
-        private[this] val row1 = new UnsafeRow
-        private[this] val row2 = new UnsafeRow
-        override def compare(
-            baseObj1: scala.Any, baseOff1: Long, baseObj2: scala.Any, baseOff2: Long): Int = {
-          row1.pointTo(baseObj1, baseOff1, numFields, schema)
-          row2.pointTo(baseObj2, baseOff2, numFields, schema)
-          ordering.compare(row1, row2)
-        }
-      }
-      val sorter = new UnsafeExternalSorter(
-        TaskContext.get.taskMemoryManager(),
-        SparkEnv.get.shuffleMemoryManager,
-        SparkEnv.get.blockManager,
-        TaskContext.get,
-        recordComparator,
-        prefixComparator,
-        4096,
-        SparkEnv.get.conf
-      )
-      while (iterator.hasNext) {
-        val row: Row = iterator.next()
-        val sizeRequirement = rowConverter.getSizeRequirement(row)
-        if (sizeRequirement / 8 > rowConversionScratchSpace.length) {
-          rowConversionScratchSpace = new Array[Long](sizeRequirement / 8)
-        } else {
-          // Zero out the buffer that's used to hold the current row. This is necessary in order
-          // to ensure that rows hash properly, since garbage data from the previous row could
-          // otherwise end up as padding in this row. As a performance optimization, we only zero
-          // out the portion of the buffer that we'll actually write to.
-          Arrays.fill(rowConversionScratchSpace, 0, sizeRequirement / 8, 0)
-        }
-        val bytesWritten =
-          rowConverter.writeRow(row, rowConversionScratchSpace, PlatformDependent.LONG_ARRAY_OFFSET)
-        assert (bytesWritten == sizeRequirement)
-        val prefix: Long = 0 // dummy prefix until we implement prefix calculation
-        sorter.insertRecord(
-          rowConversionScratchSpace,
-          PlatformDependent.LONG_ARRAY_OFFSET,
-          sizeRequirement,
-          prefix
-        )
-      }
-      val sortedIterator = sorter.getSortedIterator
-      // TODO: need to avoid memory leaks on exceptions, etc. by wrapping in resource cleanup blocks
-      // TODO: need to clean up spill files after success or failure.
-      new Iterator[Row] {
-        private[this] val row = new UnsafeRow()
-        override def hasNext: Boolean = sortedIterator.hasNext
-
-        override def next(): Row = {
-          sortedIterator.loadNext()
-          if (hasNext) {
-            row.pointTo(
-              sortedIterator.getBaseObject, sortedIterator.getBaseOffset, numFields, schema)
-            row
-          } else {
-            val rowDataCopy = new Array[Byte](sortedIterator.getRecordLength)
-            PlatformDependent.copyMemory(
-              sortedIterator.getBaseObject,
-              sortedIterator.getBaseOffset,
-              rowDataCopy,
-              PlatformDependent.BYTE_ARRAY_OFFSET,
-              sortedIterator.getRecordLength
-            )
-            row.pointTo(rowDataCopy, PlatformDependent.BYTE_ARRAY_OFFSET, numFields, schema)
-            sorter.freeMemory()
-            row
-          }
-        }
-      }
+      def prefixComputer(row: Row): Long = 0
+      new UnsafeExternalRowSorter(schema, ordering, prefixComparator, prefixComputer).sort(iterator)
     }
     child.execute().mapPartitions(doSort, preservesPartitioning = true)
   }
```
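Note that both `prefixComparator` and `prefixComputer` here are still stubs that return 0, so every comparison falls through to the full row comparator; the prefix machinery only pays off once prefixes encode the leading sort column. As an illustration (not part of this commit, and assuming `PrefixComparator` is an abstract class with a `compare(long, long)` method, as the stub above suggests), a comparator for a leading signed-long column could look like:

```java
import org.apache.spark.util.collection.unsafe.sort.PrefixComparator;

// Hypothetical prefix comparator for rows whose leading sort column is a signed long:
// most orderings can then be decided from the 8-byte prefix without loading either record.
final class LongPrefixComparator extends PrefixComparator {
  @Override
  public int compare(long prefix1, long prefix2) {
    return Long.compare(prefix1, prefix2);
  }
}
```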
