Add an Ordering for NullWritable to make the compiler generate same byte codes for RDD
apache · Dec 19, 2014 · fa40db0 · fa40db0
1 parent 9804a75
commit fa40db0
Showing 1 changed file with 12 additions and 0 deletions.
diff --git a/core/src/main/scala/org/apache/spark/rdd/RDD.scala b/core/src/main/scala/org/apache/spark/rdd/RDD.scala
@@ -1174,6 +1174,14 @@ abstract class RDD[T: ClassTag](
    * Save this RDD as a text file, using string representations of elements.
    */
   def saveAsTextFile(path: String) {
+    // Workaround for https://issues.apache.org/jira/browse/SPARK-2075:
+    // NullWritable is a Comparable rather than Comparable[NullWritable] in Hadoop 1.+,
+    // so the compiler cannot find an implicit Ordering for it there. It would then generate
+    // different anonymous classes for `saveAsTextFile` in Hadoop 1.+ and Hadoop 2.+. Therefore
+    // we provide an explicit Ordering for NullWritable so the generated bytecode is the same.
+    implicit val nullWritableOrdering = new Ordering[NullWritable] {
+      override def compare(x: NullWritable, y: NullWritable): Int = 0 // every pair compares equal
+    }
     this.map(x => (NullWritable.get(), new Text(x.toString)))
       .saveAsHadoopFile[TextOutputFormat[NullWritable, Text]](path)
   }
@@ -1182,6 +1190,10 @@ abstract class RDD[T: ClassTag](
    * Save this RDD as a compressed text file, using string representations of elements.
    */
   def saveAsTextFile(path: String, codec: Class[_ <: CompressionCodec]) {
+    // https://issues.apache.org/jira/browse/SPARK-2075 (same workaround as the overload above)
+    implicit val nullWritableOrdering = new Ordering[NullWritable] {
+      override def compare(x: NullWritable, y: NullWritable): Int = 0 // every pair compares equal
+    }
     this.map(x => (NullWritable.get(), new Text(x.toString)))
       .saveAsHadoopFile[TextOutputFormat[NullWritable, Text]](path, codec)
   }