apache · Ngone51 · Mar 18, 2021 · Apr 2, 2021 · Apr 2, 2021 · Apr 2, 2021
diff --git a/core/src/main/scala/org/apache/spark/MapOutputTracker.scala b/core/src/main/scala/org/apache/spark/MapOutputTracker.scala
@@ -35,7 +35,7 @@ import org.apache.spark.internal.Logging
 import org.apache.spark.internal.config._
 import org.apache.spark.io.CompressionCodec
 import org.apache.spark.rpc.{RpcCallContext, RpcEndpoint, RpcEndpointRef, RpcEnv}
-import org.apache.spark.scheduler.MapStatus
+import org.apache.spark.scheduler.{Location, MapStatus}
 import org.apache.spark.shuffle.MetadataFetchFailedException
 import org.apache.spark.storage.{BlockId, BlockManagerId, ShuffleBlockId}
 import org.apache.spark.util._
@@ -124,13 +124,13 @@ private class ShuffleStatus(numPartitions: Int) extends Logging {
   /**
    * Update the map output location (e.g. during migration).
    */
-  def updateMapOutput(mapId: Long, bmAddress: BlockManagerId): Unit = withWriteLock {
+  def updateMapOutput(mapId: Long, loc: Location): Unit = withWriteLock {
     try {
       val mapStatusOpt = mapStatuses.find(_.mapId == mapId)
       mapStatusOpt match {
         case Some(mapStatus) =>
-          logInfo(s"Updating map output for ${mapId} to ${bmAddress}")
-          mapStatus.updateLocation(bmAddress)
+          logInfo(s"Updating map output for $mapId to $loc")
+          mapStatus.updateLocation(loc)
           invalidateSerializedMapOutputStatusCache()
         case None =>
           logWarning(s"Asked to update map output ${mapId} for untracked map status.")
@@ -146,9 +146,9 @@ private class ShuffleStatus(numPartitions: Int) extends Logging {
    * This is a no-op if there is no registered map output or if the registered output is from a
    * different block manager.
    */
-  def removeMapOutput(mapIndex: Int, bmAddress: BlockManagerId): Unit = withWriteLock {
-    logDebug(s"Removing existing map output ${mapIndex} ${bmAddress}")
-    if (mapStatuses(mapIndex) != null && mapStatuses(mapIndex).location == bmAddress) {
+  def removeMapOutput(mapIndex: Int, loc: Location): Unit = withWriteLock {
+    logDebug(s"Removing existing map output $mapIndex $loc")
+    if (mapStatuses(mapIndex) != null && mapStatuses(mapIndex).location == loc) {
       _numAvailableOutputs -= 1
       mapStatuses(mapIndex) = null
       invalidateSerializedMapOutputStatusCache()
@@ -178,7 +178,7 @@ private class ShuffleStatus(numPartitions: Int) extends Logging {
    * Removes all shuffle outputs which satisfies the filter. Note that this will also
    * remove outputs which are served by an external shuffle server (if one exists).
    */
-  def removeOutputsByFilter(f: BlockManagerId => Boolean): Unit = withWriteLock {
+  def removeOutputsByFilter(f: Location => Boolean): Unit = withWriteLock {
     for (mapIndex <- mapStatuses.indices) {
       if (mapStatuses(mapIndex) != null && f(mapStatuses(mapIndex).location)) {
         _numAvailableOutputs -= 1
@@ -344,7 +344,7 @@ private[spark] abstract class MapOutputTracker(conf: SparkConf) extends Logging
 
   // For testing
   def getMapSizesByExecutorId(shuffleId: Int, reduceId: Int)
-      : Iterator[(BlockManagerId, Seq[(BlockId, Long, Int)])] = {
+      : Iterator[(Location, Seq[(BlockId, Long, Int)])] = {
     getMapSizesByExecutorId(shuffleId, 0, Int.MaxValue, reduceId, reduceId + 1)
   }
 
@@ -365,7 +365,7 @@ private[spark] abstract class MapOutputTracker(conf: SparkConf) extends Logging
       startMapIndex: Int,
       endMapIndex: Int,
       startPartition: Int,
-      endPartition: Int): Iterator[(BlockManagerId, Seq[(BlockId, Long, Int)])]
+      endPartition: Int): Iterator[(Location, Seq[(BlockId, Long, Int)])]
 
   /**
    * Deletes map output status information for the specified shuffle stage.
@@ -502,7 +502,7 @@ private[spark] class MapOutputTrackerMaster(
   }
 
   /** Unregister map output information of the given shuffle, mapper and block manager */
-  def unregisterMapOutput(shuffleId: Int, mapIndex: Int, bmAddress: BlockManagerId): Unit = {
+  def unregisterMapOutput(shuffleId: Int, mapIndex: Int, bmAddress: Location): Unit = {
     shuffleStatuses.get(shuffleId) match {
       case Some(shuffleStatus) =>
         shuffleStatus.removeMapOutput(mapIndex, bmAddress)
@@ -643,10 +643,10 @@ private[spark] class MapOutputTrackerMaster(
       : Seq[String] = {
     if (shuffleLocalityEnabled && dep.rdd.partitions.length < SHUFFLE_PREF_MAP_THRESHOLD &&
         dep.partitioner.numPartitions < SHUFFLE_PREF_REDUCE_THRESHOLD) {
-      val blockManagerIds = getLocationsWithLargestOutputs(dep.shuffleId, partitionId,
+      val locations = getLocationsWithLargestOutputs(dep.shuffleId, partitionId,
         dep.partitioner.numPartitions, REDUCER_PREF_LOCS_FRACTION)
-      if (blockManagerIds.nonEmpty) {
-        blockManagerIds.get.map(_.host)
+      if (locations.nonEmpty) {
+        locations.get.map(_.host)
       } else {
         Nil
       }
@@ -670,14 +670,14 @@ private[spark] class MapOutputTrackerMaster(
       reducerId: Int,
       numReducers: Int,
       fractionThreshold: Double)
-    : Option[Array[BlockManagerId]] = {
+    : Option[Array[Location]] = {
 
     val shuffleStatus = shuffleStatuses.get(shuffleId).orNull
     if (shuffleStatus != null) {
       shuffleStatus.withMapStatuses { statuses =>
         if (statuses.nonEmpty) {
           // HashMap to add up sizes of all blocks at the same location
-          val locs = new HashMap[BlockManagerId, Long]
+          val locs = new HashMap[Location, Long]
           var totalOutputSize = 0L
           var mapIdx = 0
           while (mapIdx < statuses.length) {
@@ -758,7 +758,7 @@ private[spark] class MapOutputTrackerMaster(
       startMapIndex: Int,
       endMapIndex: Int,
       startPartition: Int,
-      endPartition: Int): Iterator[(BlockManagerId, Seq[(BlockId, Long, Int)])] = {
+      endPartition: Int): Iterator[(Location, Seq[(BlockId, Long, Int)])] = {
     logDebug(s"Fetching outputs for shuffle $shuffleId")
     shuffleStatuses.get(shuffleId) match {
       case Some(shuffleStatus) =>
@@ -810,7 +810,7 @@ private[spark] class MapOutputTrackerWorker(conf: SparkConf) extends MapOutputTr
       startMapIndex: Int,
       endMapIndex: Int,
       startPartition: Int,
-      endPartition: Int): Iterator[(BlockManagerId, Seq[(BlockId, Long, Int)])] = {
+      endPartition: Int): Iterator[(Location, Seq[(BlockId, Long, Int)])] = {
     logDebug(s"Fetching outputs for shuffle $shuffleId")
     val statuses = getStatuses(shuffleId, conf)
     try {
@@ -989,9 +989,9 @@ private[spark] object MapOutputTracker extends Logging {
       endPartition: Int,
       statuses: Array[MapStatus],
       startMapIndex : Int,
-      endMapIndex: Int): Iterator[(BlockManagerId, Seq[(BlockId, Long, Int)])] = {
+      endMapIndex: Int): Iterator[(Location, Seq[(BlockId, Long, Int)])] = {
     assert (statuses != null)
-    val splitsByAddress = new HashMap[BlockManagerId, ListBuffer[(BlockId, Long, Int)]]
+    val splitsByAddress = new HashMap[Location, ListBuffer[(BlockId, Long, Int)]]
     val iter = statuses.iterator.zipWithIndex
     for ((status, mapIndex) <- iter.slice(startMapIndex, endMapIndex)) {
       if (status == null) {

diff --git a/core/src/main/scala/org/apache/spark/TaskEndReason.scala b/core/src/main/scala/org/apache/spark/TaskEndReason.scala
@@ -21,8 +21,7 @@ import java.io.{ObjectInputStream, ObjectOutputStream}
 
 import org.apache.spark.annotation.DeveloperApi
 import org.apache.spark.internal.Logging
-import org.apache.spark.scheduler.AccumulableInfo
-import org.apache.spark.storage.BlockManagerId
+import org.apache.spark.scheduler.{AccumulableInfo, Location}
 import org.apache.spark.util.{AccumulatorV2, Utils}
 
 // ==============================================================================================
@@ -81,7 +80,7 @@ case object Resubmitted extends TaskFailedReason {
  */
 @DeveloperApi
 case class FetchFailed(
-    bmAddress: BlockManagerId,  // Note that bmAddress can be null
+    bmAddress: Location,  // Note that bmAddress can be null
     shuffleId: Int,
     mapId: Long,
     mapIndex: Int,

diff --git a/core/src/main/scala/org/apache/spark/scheduler/MapStatus.scala b/core/src/main/scala/org/apache/spark/scheduler/MapStatus.scala
@@ -28,16 +28,23 @@ import org.apache.spark.internal.config
 import org.apache.spark.storage.BlockManagerId
 import org.apache.spark.util.Utils
 
+trait Location extends Externalizable {  // Where a task's map output is stored.
+  def host: String  // Host of this location.
+  def port: Int  // Port of this location.
+  def hostPort: String  // BlockManagerId renders this as "host:port".
+  def executorId: String = "unknown"  // Placeholder default; BlockManagerId overrides it.
+}
+
 /**
  * Result returned by a ShuffleMapTask to a scheduler. Includes the block manager address that the
  * task has shuffle files stored on as well as the sizes of outputs for each reducer, for passing
  * on to the reduce tasks.
  */
 private[spark] sealed trait MapStatus {
   /** Location where this task output is. */
-  def location: BlockManagerId
+  def location: Location
 
-  def updateLocation(newLoc: BlockManagerId): Unit
+  def updateLocation(newLoc: Location): Unit
 
   /**
    * Estimated size for the reduce block, in bytes.
@@ -66,7 +73,7 @@ private[spark] object MapStatus {
     .getOrElse(config.SHUFFLE_MIN_NUM_PARTS_TO_HIGHLY_COMPRESS.defaultValue.get)
 
   def apply(
-      loc: BlockManagerId,
+      loc: Location,
       uncompressedSizes: Array[Long],
       mapTaskId: Long): MapStatus = {
     if (uncompressedSizes.length > minPartitionsToUseHighlyCompressMapStatus) {
@@ -115,21 +122,21 @@ private[spark] object MapStatus {
  * @param _mapTaskId unique task id for the task
  */
 private[spark] class CompressedMapStatus(
-    private[this] var loc: BlockManagerId,
+    private[this] var loc: Location,
     private[this] var compressedSizes: Array[Byte],
     private[this] var _mapTaskId: Long)
   extends MapStatus with Externalizable {
 
   // For deserialization only
   protected def this() = this(null, null.asInstanceOf[Array[Byte]], -1)
 
-  def this(loc: BlockManagerId, uncompressedSizes: Array[Long], mapTaskId: Long) = {
+  def this(loc: Location, uncompressedSizes: Array[Long], mapTaskId: Long) = {
     this(loc, uncompressedSizes.map(MapStatus.compressSize), mapTaskId)
   }
 
-  override def location: BlockManagerId = loc
+  override def location: Location = loc
 
-  override def updateLocation(newLoc: BlockManagerId): Unit = {
+  override def updateLocation(newLoc: Location): Unit = {
     loc = newLoc
   }
 
@@ -168,7 +175,7 @@ private[spark] class CompressedMapStatus(
  * @param _mapTaskId unique task id for the task
  */
 private[spark] class HighlyCompressedMapStatus private (
-    private[this] var loc: BlockManagerId,
+    private[this] var loc: Location,
     private[this] var numNonEmptyBlocks: Int,
     private[this] var emptyBlocks: RoaringBitmap,
     private[this] var avgSize: Long,
@@ -183,9 +190,9 @@ private[spark] class HighlyCompressedMapStatus private (
 
   protected def this() = this(null, -1, null, -1, null, -1)  // For deserialization only
 
-  override def location: BlockManagerId = loc
+  override def location: Location = loc
 
-  override def updateLocation(newLoc: BlockManagerId): Unit = {
+  override def updateLocation(newLoc: Location): Unit = {
     loc = newLoc
   }
 
@@ -216,7 +223,10 @@ private[spark] class HighlyCompressedMapStatus private (
   }
 
   override def readExternal(in: ObjectInput): Unit = Utils.tryOrIOException {
-    loc = BlockManagerId(in)
+    // TODO(wuyi): make the Location implementation class configurable instead of hard-coding it
+    val location = "org.apache.spark.storage.BlockManagerId"
+    loc = Utils.classForName(location).newInstance().asInstanceOf[Location]
+    loc.readExternal(in)
     numNonEmptyBlocks = -1 // SPARK-32436 Scala 2.13 doesn't initialize this during deserialization
     emptyBlocks = new RoaringBitmap()
     emptyBlocks.deserialize(in)
@@ -235,7 +245,7 @@ private[spark] class HighlyCompressedMapStatus private (
 
 private[spark] object HighlyCompressedMapStatus {
   def apply(
-      loc: BlockManagerId,
+      loc: Location,
       uncompressedSizes: Array[Long],
       mapTaskId: Long): HighlyCompressedMapStatus = {
     // We must keep track of which blocks are empty so that we don't report a zero-sized

diff --git a/core/src/main/scala/org/apache/spark/shuffle/BlockStoreShuffleReader.scala b/core/src/main/scala/org/apache/spark/shuffle/BlockStoreShuffleReader.scala
@@ -20,8 +20,9 @@ package org.apache.spark.shuffle
 import org.apache.spark._
 import org.apache.spark.internal.{config, Logging}
 import org.apache.spark.io.CompressionCodec
+import org.apache.spark.scheduler.Location
 import org.apache.spark.serializer.SerializerManager
-import org.apache.spark.storage.{BlockId, BlockManager, BlockManagerId, ShuffleBlockFetcherIterator}
+import org.apache.spark.storage.{BlockId, BlockManager, ShuffleBlockFetcherIterator}
 import org.apache.spark.util.CompletionIterator
 import org.apache.spark.util.collection.ExternalSorter
 
@@ -30,7 +31,7 @@ import org.apache.spark.util.collection.ExternalSorter
  */
 private[spark] class BlockStoreShuffleReader[K, C](
     handle: BaseShuffleHandle[K, _, C],
-    blocksByAddress: Iterator[(BlockManagerId, Seq[(BlockId, Long, Int)])],
+    blocksByAddress: Iterator[(Location, Seq[(BlockId, Long, Int)])],
     context: TaskContext,
     readMetrics: ShuffleReadMetricsReporter,
     serializerManager: SerializerManager = SparkEnv.get.serializerManager,

diff --git a/core/src/main/scala/org/apache/spark/shuffle/FetchFailedException.scala b/core/src/main/scala/org/apache/spark/shuffle/FetchFailedException.scala
@@ -18,7 +18,7 @@
 package org.apache.spark.shuffle
 
 import org.apache.spark.{FetchFailed, TaskContext, TaskFailedReason}
-import org.apache.spark.storage.BlockManagerId
+import org.apache.spark.scheduler.Location
 import org.apache.spark.util.Utils
 
 /**
@@ -33,7 +33,7 @@ import org.apache.spark.util.Utils
  * (or risk triggering any other exceptions).  See SPARK-19276.
  */
 private[spark] class FetchFailedException(
-    bmAddress: BlockManagerId,
+    bmAddress: Location,
     shuffleId: Int,
     mapId: Long,
     mapIndex: Int,
@@ -43,7 +43,7 @@ private[spark] class FetchFailedException(
   extends Exception(message, cause) {
 
   def this(
-      bmAddress: BlockManagerId,
+      bmAddress: Location,
       shuffleId: Int,
       mapTaskId: Long,
       mapIndex: Int,

diff --git a/core/src/main/scala/org/apache/spark/storage/BlockManagerId.scala b/core/src/main/scala/org/apache/spark/storage/BlockManagerId.scala
@@ -17,12 +17,14 @@
 
 package org.apache.spark.storage
 
-import java.io.{Externalizable, IOException, ObjectInput, ObjectOutput}
+import java.io.{IOException, ObjectInput, ObjectOutput}
 
 import com.google.common.cache.{CacheBuilder, CacheLoader}
 
 import org.apache.spark.SparkContext
 import org.apache.spark.annotation.DeveloperApi
+import org.apache.spark.scheduler.Location
+import org.apache.spark.storage.BlockManagerId.getCachedBlockManagerId
 import org.apache.spark.util.Utils
 
 /**
@@ -40,27 +42,27 @@ class BlockManagerId private (
     private var host_ : String,
     private var port_ : Int,
     private var topologyInfo_ : Option[String])
-  extends Externalizable {
+  extends Location {
 
   private def this() = this(null, null, 0, None)  // For deserialization only
 
-  def executorId: String = executorId_
+  override def executorId: String = executorId_
 
   if (null != host_) {
     Utils.checkHost(host_)
     assert (port_ > 0)
   }
 
-  def hostPort: String = {
+  override def hostPort: String = {
     // DEBUG code
     Utils.checkHost(host)
     assert (port > 0)
     host + ":" + port
   }
 
-  def host: String = host_
+  override def host: String = host_
 
-  def port: Int = port_
+  override def port: Int = port_
 
   def topologyInfo: Option[String] = topologyInfo_
 
@@ -83,6 +85,7 @@ class BlockManagerId private (
     port_ = in.readInt()
     val isTopologyInfoAvailable = in.readBoolean()
     topologyInfo_ = if (isTopologyInfoAvailable) Option(in.readUTF()) else None
+    getCachedBlockManagerId(this)
   }
 
   @throws(classOf[IOException])
@@ -129,7 +132,7 @@ private[spark] object BlockManagerId {
   def apply(in: ObjectInput): BlockManagerId = {
     val obj = new BlockManagerId()
     obj.readExternal(in)
-    getCachedBlockManagerId(obj)
+    obj
   }
 
   /**