apache · onursatici · Jul 18, 2018 · Jul 19, 2018 · Jul 20, 2018 · Jul 23, 2018
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/InMemoryRelation.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/InMemoryRelation.scala
@@ -50,6 +50,8 @@ case class CachedRDDBuilder(
     tableName: Option[String])(
     @transient private var _cachedColumnBuffers: RDD[CachedBatch] = null) {
 
+  /**
+   * Short textual form of this builder that lists only `useCompression`, `batchSize` and
+   * `storageLevel`; the cached plan and the table name are intentionally not rendered.
+   */
+  override def toString: String = {
+    val settings = s"$useCompression, $batchSize, $storageLevel"
+    s"CachedRDDBuilder($settings)"
+  }
+
   val sizeInBytesStats: LongAccumulator = cachedPlan.sqlContext.sparkContext.longAccumulator
 
   def cachedColumnBuffers: RDD[CachedBatch] = {

diff --git a/sql/core/src/test/scala/org/apache/spark/sql/DatasetCacheSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/DatasetCacheSuite.scala
@@ -206,4 +206,19 @@ class DatasetCacheSuite extends QueryTest with SharedSQLContext with TimeLimits
     // first time use, load cache
     checkDataset(df5, Row(10))
   }
+
+  test("SPARK-24850 InMemoryRelation string representation does not include cached plan") {
+    // A minimal `spark.range(0, 1)` query supplies the physical and logical plans to wrap.
+    val qe = spark.range(0, 1).toDF().queryExecution
+    val cachedPlan = qe.sparkPlan
+    val relation = InMemoryRelation(
+      true, 1000, StorageLevel.MEMORY_ONLY, cachedPlan, Some("test-relation"), qe.logical)
+    val rendered = relation.simpleString
+    val expectedBuilder =
+      "CachedRDDBuilder(true, 1000, StorageLevel(memory, deserialized, 1 replicas))"
+
+    // The one-line description must show the builder settings but not the full cached plan.
+    assert(!rendered.contains(cachedPlan.toString))
+    assert(rendered.contains(expectedBuilder))
+  }
 }