From cad6a1fa6f8e0dc2cd89adb561711b22acf0ebdb Mon Sep 17 00:00:00 2001
From: Jungtaek Lim
Date: Fri, 17 Aug 2018 18:56:31 +0900
Subject: [PATCH 01/13] [SPARK-25151][SS] Apply Apache Commons Pool to KafkaDataConsumer

* Fix scala style check violation
* Add commons-pool2 version property to root pom.xml
* Add eviction to the pool, which enables cleaning up idle consumers
* Fix missed spots
* New approach: pool both Kafka consumers and fetched data individually
** This approach enables applying different policies to each pool
** This approach also enables evicting consumers and fetched data for invalid topics/partitions
** This approach can handle the case where multiple tasks access the same topic partition and group id
* Address review comments from @gaborgsomogyi
* Address more review comments from @gaborgsomogyi
* Fix silly mistake
* Add sanity/edge-case tests on KafkaDataConsumer
** also add basic metrics to verify behavior of the fetched data pool
* Apply new fetched data pool metrics to unit tests in FetchedDataPoolSuite
* Fix test failures (forgot to reset TestContext)
* Address further review comments from @gaborgsomogyi
* Try best-effort to isolate environments for UTs
* Fix scalastyle
* Reflect low-hanging-fruit review comments
* Use ConfigBuilder, rename config, etc.
* Address build failure because of class rename
* Address review comment
---
 external/kafka-0-10-sql/pom.xml               |   5 +
 .../spark/sql/kafka010/FetchedDataPool.scala  | 190 +++++
 .../kafka010/InternalKafkaConsumerPool.scala  | 226 ++++++
 .../spark/sql/kafka010/KafkaBatch.scala       |   2 +-
 .../kafka010/KafkaBatchPartitionReader.scala  |  11 +-
 .../sql/kafka010/KafkaContinuousStream.scala  |   2 +-
 .../sql/kafka010/KafkaDataConsumer.scala      | 677 +++++++++---------
 .../sql/kafka010/KafkaMicroBatchStream.scala  |   7 +-
 .../spark/sql/kafka010/KafkaRelation.scala    |   2 +-
 .../spark/sql/kafka010/KafkaSource.scala      |   3 +-
 .../spark/sql/kafka010/KafkaSourceRDD.scala   |   5 +-
 .../apache/spark/sql/kafka010/package.scala   |  21 +
 .../sql/kafka010/FetchedDataPoolSuite.scala   | 337 +++++++++
 .../InternalKafkaConsumerPoolSuite.scala      | 316 ++++++++
 .../sql/kafka010/KafkaDataConsumerSuite.scala | 203 +++++-
 .../kafka010/KafkaMicroBatchSourceSuite.scala |   1 -
 pom.xml                                       |   2 +
 17 files changed, 1617 insertions(+), 393 deletions(-)
 create mode 100644 external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/FetchedDataPool.scala
 create mode 100644 external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPool.scala
 create mode 100644 external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/FetchedDataPoolSuite.scala
 create mode 100644 external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPoolSuite.scala

diff --git a/external/kafka-0-10-sql/pom.xml b/external/kafka-0-10-sql/pom.xml
index 827ceb89a0c3..feba787e9901 100644
--- a/external/kafka-0-10-sql/pom.xml
+++ b/external/kafka-0-10-sql/pom.xml
@@ -72,6 +72,11 @@
       <artifactId>kafka-clients</artifactId>
       <version>${kafka.version}</version>
     </dependency>
+    <dependency>
+      <groupId>org.apache.commons</groupId>
+      <artifactId>commons-pool2</artifactId>
+      <version>${commons-pool2.version}</version>
+    </dependency>
     <dependency>
       <groupId>org.apache.kafka</groupId>
       <artifactId>kafka_${scala.binary.version}</artifactId>
diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/FetchedDataPool.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/FetchedDataPool.scala
new file mode 100644
index 000000000000..a408c27d21f8
--- /dev/null
+++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/FetchedDataPool.scala
@@ -0,0 +1,190 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.spark.sql.kafka010 + +import java.{util => ju} +import java.util.concurrent.{ScheduledFuture, TimeUnit} +import java.util.concurrent.atomic.LongAdder + +import scala.collection.mutable +import scala.util.control.NonFatal + +import org.apache.kafka.clients.consumer.ConsumerRecord + +import org.apache.spark.SparkEnv +import org.apache.spark.internal.Logging +import org.apache.spark.sql.kafka010.KafkaDataConsumer.{CacheKey, UNKNOWN_OFFSET} +import org.apache.spark.util.ThreadUtils + +/** + * Provides object pool for [[FetchedData]] which is grouped by [[CacheKey]]. + * + * Along with CacheKey, it receives desired start offset to find cached FetchedData which + * may be stored from previous batch. If it can't find one to match, it will create + * a new FetchedData. + */ +private[kafka010] class FetchedDataPool extends Logging { + import FetchedDataPool._ + + private val cache: mutable.Map[CacheKey, CachedFetchedDataList] = mutable.HashMap.empty + + private val (minEvictableIdleTimeMillis, evictorThreadRunIntervalMillis): (Long, Long) = { + val conf = SparkEnv.get.conf + + val minEvictIdleTime = conf.getLong(CONFIG_NAME_MIN_EVICTABLE_IDLE_TIME_MILLIS, + DEFAULT_VALUE_MIN_EVICTABLE_IDLE_TIME_MILLIS) + + val evictorThreadInterval = conf.getLong( + CONFIG_NAME_EVICTOR_THREAD_RUN_INTERVAL_MILLIS, + DEFAULT_VALUE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS) + + (minEvictIdleTime, evictorThreadInterval) + } + + private val executorService = ThreadUtils.newDaemonSingleThreadScheduledExecutor( + "kafka-fetched-data-cache-evictor") + + private def startEvictorThread(): ScheduledFuture[_] = { + executorService.scheduleAtFixedRate(new Runnable { + override def run(): Unit = { + try { + removeIdleFetchedData() + } catch { + case NonFatal(e) => + logWarning("Exception occurred while removing idle fetched data.", e) + } + } + }, 0, evictorThreadRunIntervalMillis, TimeUnit.MILLISECONDS) + } + + private var scheduled = startEvictorThread() + + private val numCreatedFetchedData = new LongAdder() + private val numTotalElements = new LongAdder() + + def getNumCreated: Long = numCreatedFetchedData.sum() + def getNumTotal: Long = numTotalElements.sum() + + def acquire(key: CacheKey, desiredStartOffset: Long): FetchedData = synchronized { + val fetchedDataList = cache.getOrElseUpdate(key, new CachedFetchedDataList()) + + val cachedFetchedDataOption = fetchedDataList.find { p => + !p.inUse && p.getObject.nextOffsetInFetchedData == desiredStartOffset + } + + var cachedFetchedData: CachedFetchedData = null + if (cachedFetchedDataOption.isDefined) { + cachedFetchedData = cachedFetchedDataOption.get + } else { + cachedFetchedData = CachedFetchedData.empty() + fetchedDataList += cachedFetchedData + + numCreatedFetchedData.increment() + numTotalElements.increment() + } + + 
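+    // Record the acquisition time and mark this entry as in use: the idle evictor
+    // (removeIdleFetchedData) only removes entries that are not in use and whose
+    // lastReleasedTimestamp is older than minEvictableIdleTimeMillis.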
cachedFetchedData.lastAcquiredTimestamp = System.currentTimeMillis() + cachedFetchedData.inUse = true + + cachedFetchedData.getObject + } + + def invalidate(key: CacheKey): Unit = synchronized { + cache.remove(key) match { + case Some(lst) => numTotalElements.add(-1 * lst.size) + case None => + } + } + + def release(key: CacheKey, fetchedData: FetchedData): Unit = synchronized { + cache.get(key) match { + case Some(fetchedDataList) => + val cachedFetchedDataOption = fetchedDataList.find { p => + p.inUse && p.getObject == fetchedData + } + + if (cachedFetchedDataOption.isDefined) { + val cachedFetchedData = cachedFetchedDataOption.get + cachedFetchedData.inUse = false + cachedFetchedData.lastReleasedTimestamp = System.currentTimeMillis() + } + + case None => logWarning(s"No matching data in pool for $fetchedData in key $key. " + + "It might be released before, or it was not a part of pool.") + } + } + + def shutdown(): Unit = { + executorService.shutdownNow() + } + + def reset(): Unit = synchronized { + scheduled.cancel(true) + + cache.clear() + numTotalElements.reset() + numCreatedFetchedData.reset() + + scheduled = startEvictorThread() + } + + private def removeIdleFetchedData(): Unit = synchronized { + val timestamp = System.currentTimeMillis() + val maxAllowedIdleTimestamp = timestamp - minEvictableIdleTimeMillis + cache.values.foreach { p: CachedFetchedDataList => + val idles = p.filter(q => !q.inUse && q.lastReleasedTimestamp < maxAllowedIdleTimestamp) + val lstSize = p.size + idles.foreach(idle => p -= idle) + numTotalElements.add(-1 * (lstSize - p.size)) + } + } +} + +private[kafka010] object FetchedDataPool { + private[kafka010] case class CachedFetchedData(fetchedData: FetchedData) { + var lastReleasedTimestamp: Long = Long.MaxValue + var lastAcquiredTimestamp: Long = Long.MinValue + var inUse: Boolean = false + + def getObject: FetchedData = fetchedData + } + + private object CachedFetchedData { + def empty(): CachedFetchedData = { + val emptyData = FetchedData( + ju.Collections.emptyListIterator[ConsumerRecord[Array[Byte], Array[Byte]]], + UNKNOWN_OFFSET, + UNKNOWN_OFFSET) + + CachedFetchedData(emptyData) + } + } + + private[kafka010] type CachedFetchedDataList = mutable.ListBuffer[CachedFetchedData] + + val CONFIG_NAME_PREFIX = "spark.sql.kafkaFetchedDataCache." + val CONFIG_NAME_MIN_EVICTABLE_IDLE_TIME_MILLIS = CONFIG_NAME_PREFIX + + "minEvictableIdleTimeMillis" + val CONFIG_NAME_EVICTOR_THREAD_RUN_INTERVAL_MILLIS = CONFIG_NAME_PREFIX + + "evictorThreadRunIntervalMillis" + + val DEFAULT_VALUE_MIN_EVICTABLE_IDLE_TIME_MILLIS = 10 * 60 * 1000 // 10 minutes + val DEFAULT_VALUE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS = 5 * 60 * 1000 // 3 minutes + + def build: FetchedDataPool = new FetchedDataPool() +} diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPool.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPool.scala new file mode 100644 index 000000000000..f268508a7c61 --- /dev/null +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPool.scala @@ -0,0 +1,226 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. 
You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.spark.sql.kafka010 + +import java.{util => ju} +import java.util.concurrent.ConcurrentHashMap + +import org.apache.commons.pool2.{BaseKeyedPooledObjectFactory, PooledObject, SwallowedExceptionListener} +import org.apache.commons.pool2.impl.{DefaultEvictionPolicy, DefaultPooledObject, GenericKeyedObjectPool, GenericKeyedObjectPoolConfig} + +import org.apache.spark.SparkEnv +import org.apache.spark.internal.Logging +import org.apache.spark.sql.kafka010.InternalKafkaConsumerPool._ +import org.apache.spark.sql.kafka010.KafkaDataConsumer.CacheKey + +/** + * Provides object pool for [[InternalKafkaConsumer]] which is grouped by [[CacheKey]]. + * + * This class leverages [[GenericKeyedObjectPool]] internally, hence providing methods based on + * the class, and same contract applies: after using the borrowed object, you must either call + * returnObject() if the object is healthy to return to pool, or invalidateObject() if the object + * should be destroyed. + * + * The soft capacity of pool is determined by "spark.sql.kafkaConsumerCache.capacity" config value, + * and the pool will have reasonable default value if the value is not provided. + * (The instance will do its best effort to respect soft capacity but it can exceed when there's + * a borrowing request and there's neither free space nor idle object to clear.) + * + * This class guarantees that no caller will get pooled object once the object is borrowed and + * not yet returned, hence provide thread-safety usage of non-thread-safe [[InternalKafkaConsumer]] + * unless caller shares the object to multiple threads. + */ +private[kafka010] class InternalKafkaConsumerPool( + objectFactory: ObjectFactory, + poolConfig: PoolConfig) { + + // the class is intended to have only soft capacity + assert(poolConfig.getMaxTotal < 0) + + private lazy val pool = { + val internalPool = new GenericKeyedObjectPool[CacheKey, InternalKafkaConsumer]( + objectFactory, poolConfig) + internalPool.setSwallowedExceptionListener(CustomSwallowedExceptionListener) + internalPool + } + + /** + * Borrows [[InternalKafkaConsumer]] object from the pool. If there's no idle object for the key, + * the pool will create the [[InternalKafkaConsumer]] object. + * + * If the pool doesn't have idle object for the key and also exceeds the soft capacity, + * pool will try to clear some of idle objects. + * + * Borrowed object must be returned by either calling returnObject or invalidateObject, otherwise + * the object will be kept in pool as active object. + */ + def borrowObject(key: CacheKey, kafkaParams: ju.Map[String, Object]): InternalKafkaConsumer = { + updateKafkaParamForKey(key, kafkaParams) + + if (getTotal == poolConfig.getSoftMaxTotal()) { + pool.clearOldest() + } + + pool.borrowObject(key) + } + + /** Returns borrowed object to the pool. */ + def returnObject(consumer: InternalKafkaConsumer): Unit = { + pool.returnObject(extractCacheKey(consumer), consumer) + } + + /** Invalidates (destroy) borrowed object to the pool. 
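+   * The underlying Kafka consumer is closed via ObjectFactory.destroyObject and is not reused.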
*/ + def invalidateObject(consumer: InternalKafkaConsumer): Unit = { + pool.invalidateObject(extractCacheKey(consumer), consumer) + } + + /** Invalidates all idle consumers for the key */ + def invalidateKey(key: CacheKey): Unit = { + pool.clear(key) + } + + /** + * Closes the keyed object pool. Once the pool is closed, + * borrowObject will fail with [[IllegalStateException]], but returnObject and invalidateObject + * will continue to work, with returned objects destroyed on return. + * + * Also destroys idle instances in the pool. + */ + def close(): Unit = { + pool.close() + } + + def reset(): Unit = { + // this is the best-effort of clearing up. otherwise we should close the pool and create again + // but we don't want to make it "var" only because of tests. + pool.clear() + } + + def getNumIdle: Int = pool.getNumIdle + + def getNumIdle(key: CacheKey): Int = pool.getNumIdle(key) + + def getNumActive: Int = pool.getNumActive + + def getNumActive(key: CacheKey): Int = pool.getNumActive(key) + + def getTotal: Int = getNumIdle + getNumActive + + def getTotal(key: CacheKey): Int = getNumIdle(key) + getNumActive(key) + + private def updateKafkaParamForKey(key: CacheKey, kafkaParams: ju.Map[String, Object]): Unit = { + // We can assume that kafkaParam should not be different for same cache key, + // otherwise we can't reuse the cached object and cache key should contain kafkaParam. + // So it should be safe to put the key/value pair only when the key doesn't exist. + val oldKafkaParams = objectFactory.keyToKafkaParams.putIfAbsent(key, kafkaParams) + require(oldKafkaParams == null || kafkaParams == oldKafkaParams, "Kafka parameters for same " + + s"cache key should be equal. old parameters: $oldKafkaParams new parameters: $kafkaParams") + } + + private def extractCacheKey(consumer: InternalKafkaConsumer): CacheKey = { + new CacheKey(consumer.topicPartition, consumer.kafkaParams) + } +} + +private[kafka010] object InternalKafkaConsumerPool { + + /** + * Builds the pool for [[InternalKafkaConsumer]]. The pool instance is created per each call. + */ + def build: InternalKafkaConsumerPool = { + val objFactory = new ObjectFactory + val poolConfig = new PoolConfig + new InternalKafkaConsumerPool(objFactory, poolConfig) + } + + object CustomSwallowedExceptionListener extends SwallowedExceptionListener with Logging { + override def onSwallowException(e: Exception): Unit = { + logError(s"Error closing Kafka consumer", e) + } + } + + class PoolConfig extends GenericKeyedObjectPoolConfig[InternalKafkaConsumer] { + private var softMaxTotal = Int.MaxValue + + def getSoftMaxTotal(): Int = softMaxTotal + + init() + + def init(): Unit = { + val conf = SparkEnv.get.conf + + softMaxTotal = conf.get(CONSUMER_CACHE_CAPACITY) + + val jmxEnabled = conf.get(CONSUMER_CACHE_JMX_ENABLED) + val minEvictableIdleTimeMillis = conf.get(CONSUMER_CACHE_MIN_EVICTABLE_IDLE_TIME_MILLIS) + val evictorThreadRunIntervalMillis = conf.get( + CONSUMER_CACHE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS) + + // NOTE: Below lines define the behavior, so do not modify unless you know what you are + // doing, and update the class doc accordingly if necessary when you modify. + + // 1. Set min idle objects per key to 0 to avoid creating unnecessary object. + // 2. Set max idle objects per key to 3 but set total objects per key to infinite + // which ensures borrowing per key is not restricted. + // 3. Set max total objects to infinite which ensures all objects are managed in this pool. 
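+      // (The soft capacity is not enforced by these settings: InternalKafkaConsumerPool.borrowObject()
+      // calls pool.clearOldest() to evict idle consumers once the total reaches the soft max.)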
+ setMinIdlePerKey(0) + setMaxIdlePerKey(3) + setMaxTotalPerKey(-1) + setMaxTotal(-1) + + // Set minimum evictable idle time which will be referred from evictor thread + setMinEvictableIdleTimeMillis(minEvictableIdleTimeMillis) + setSoftMinEvictableIdleTimeMillis(-1) + + // evictor thread will run test with ten idle objects + setTimeBetweenEvictionRunsMillis(evictorThreadRunIntervalMillis) + setNumTestsPerEvictionRun(10) + setEvictionPolicy(new DefaultEvictionPolicy[InternalKafkaConsumer]()) + + // Immediately fail on exhausted pool while borrowing + setBlockWhenExhausted(false) + + setJmxEnabled(jmxEnabled) + setJmxNamePrefix("kafka010-cached-simple-kafka-consumer-pool") + } + } + + class ObjectFactory extends BaseKeyedPooledObjectFactory[CacheKey, InternalKafkaConsumer] + with Logging { + + val keyToKafkaParams: ConcurrentHashMap[CacheKey, ju.Map[String, Object]] = + new ConcurrentHashMap[CacheKey, ju.Map[String, Object]]() + + override def create(key: CacheKey): InternalKafkaConsumer = { + Option(keyToKafkaParams.get(key)) match { + case Some(kafkaParams) => new InternalKafkaConsumer(key.topicPartition, kafkaParams) + case None => throw new IllegalStateException("Kafka params should be set before " + + "borrowing object.") + } + } + + override def wrap(value: InternalKafkaConsumer): PooledObject[InternalKafkaConsumer] = { + new DefaultPooledObject[InternalKafkaConsumer](value) + } + + override def destroyObject(key: CacheKey, p: PooledObject[InternalKafkaConsumer]): Unit = { + p.getObject.close() + } + } +} + diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaBatch.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaBatch.scala index 839a64ed3132..700414167f3e 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaBatch.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaBatch.scala @@ -91,7 +91,7 @@ private[kafka010] class KafkaBatch( KafkaSourceProvider.kafkaParamsForExecutors(specifiedKafkaParams, uniqueGroupId) offsetRanges.map { range => new KafkaBatchInputPartition( - range, executorKafkaParams, pollTimeoutMs, failOnDataLoss, false) + range, executorKafkaParams, pollTimeoutMs, failOnDataLoss) }.toArray } diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaBatchPartitionReader.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaBatchPartitionReader.scala index cbc2fbfce319..53b0b3c46854 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaBatchPartitionReader.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaBatchPartitionReader.scala @@ -30,14 +30,13 @@ private[kafka010] case class KafkaBatchInputPartition( offsetRange: KafkaOffsetRange, executorKafkaParams: ju.Map[String, Object], pollTimeoutMs: Long, - failOnDataLoss: Boolean, - reuseKafkaConsumer: Boolean) extends InputPartition + failOnDataLoss: Boolean) extends InputPartition private[kafka010] object KafkaBatchReaderFactory extends PartitionReaderFactory { override def createReader(partition: InputPartition): PartitionReader[InternalRow] = { val p = partition.asInstanceOf[KafkaBatchInputPartition] KafkaBatchPartitionReader(p.offsetRange, p.executorKafkaParams, p.pollTimeoutMs, - p.failOnDataLoss, p.reuseKafkaConsumer) + p.failOnDataLoss) } } @@ -46,11 +45,9 @@ private case class KafkaBatchPartitionReader( offsetRange: KafkaOffsetRange, executorKafkaParams: 
ju.Map[String, Object], pollTimeoutMs: Long, - failOnDataLoss: Boolean, - reuseKafkaConsumer: Boolean) extends PartitionReader[InternalRow] with Logging { + failOnDataLoss: Boolean) extends PartitionReader[InternalRow] with Logging { - private val consumer = KafkaDataConsumer.acquire( - offsetRange.topicPartition, executorKafkaParams, reuseKafkaConsumer) + private val consumer = KafkaDataConsumer.acquire(offsetRange.topicPartition, executorKafkaParams) private val rangeToRead = resolveRange(offsetRange) private val converter = new KafkaRecordToUnsafeRowConverter diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaContinuousStream.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaContinuousStream.scala index 18d740eaa968..a9c1181a01c5 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaContinuousStream.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaContinuousStream.scala @@ -185,7 +185,7 @@ class KafkaContinuousPartitionReader( kafkaParams: ju.Map[String, Object], pollTimeoutMs: Long, failOnDataLoss: Boolean) extends ContinuousPartitionReader[InternalRow] { - private val consumer = KafkaDataConsumer.acquire(topicPartition, kafkaParams, useCache = false) + private val consumer = KafkaDataConsumer.acquire(topicPartition, kafkaParams) private val converter = new KafkaRecordToUnsafeRowConverter private var nextKafkaOffset = startOffset diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaDataConsumer.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaDataConsumer.scala index af240dc04eea..9e98ae562937 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaDataConsumer.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaDataConsumer.scala @@ -18,6 +18,7 @@ package org.apache.spark.sql.kafka010 import java.{util => ju} +import java.io.Closeable import java.util.concurrent.TimeoutException import scala.collection.JavaConverters._ @@ -25,169 +26,200 @@ import scala.collection.JavaConverters._ import org.apache.kafka.clients.consumer.{ConsumerConfig, ConsumerRecord, KafkaConsumer, OffsetOutOfRangeException} import org.apache.kafka.common.TopicPartition -import org.apache.spark.{SparkEnv, SparkException, TaskContext} +import org.apache.spark.TaskContext import org.apache.spark.internal.Logging import org.apache.spark.kafka010.KafkaConfigUpdater -import org.apache.spark.sql.kafka010.KafkaDataConsumer.AvailableOffsetRange +import org.apache.spark.sql.kafka010.KafkaDataConsumer.{AvailableOffsetRange, UNKNOWN_OFFSET} import org.apache.spark.sql.kafka010.KafkaSourceProvider._ -import org.apache.spark.util.UninterruptibleThread +import org.apache.spark.util.{ShutdownHookManager, UninterruptibleThread} + +/** + * This class simplifies the usages of Kafka consumer in Spark SQL Kafka connector. + * + * NOTE: Like KafkaConsumer, this class is not thread-safe. + * NOTE for contributors: It is possible for the instance to be used from multiple callers, + * so all the methods should not rely on current cursor and use seek manually. 
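+ * NOTE: Instances are pooled by [[InternalKafkaConsumerPool]]; a borrowed instance must be
+ * returned to (or invalidated in) that pool after use so it can be reused or closed.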
+ */ +private[kafka010] class InternalKafkaConsumer( + val topicPartition: TopicPartition, + val kafkaParams: ju.Map[String, Object]) extends Closeable with Logging { + + val groupId = kafkaParams.get(ConsumerConfig.GROUP_ID_CONFIG).asInstanceOf[String] + + private val consumer = createConsumer -private[kafka010] sealed trait KafkaDataConsumer { /** - * Get the record for the given offset if available. - * - * If the record is invisible (either a - * transaction message, or an aborted message when the consumer's `isolation.level` is - * `read_committed`), it will be skipped and this method will try to fetch next available record - * within [offset, untilOffset). + * Poll messages from Kafka starting from `offset` and returns a pair of "list of consumer record" + * and "offset after poll". The list of consumer record may be empty if the Kafka consumer fetches + * some messages but all of them are not visible messages (either transaction messages, + * or aborted messages when `isolation.level` is `read_committed`). * - * This method also will try its best to detect data loss. If `failOnDataLoss` is `true`, it will - * throw an exception when we detect an unavailable offset. If `failOnDataLoss` is `false`, this - * method will try to fetch next available record within [offset, untilOffset). - * - * When this method tries to skip offsets due to either invisible messages or data loss and - * reaches `untilOffset`, it will return `null`. - * - * @param offset the offset to fetch. - * @param untilOffset the max offset to fetch. Exclusive. - * @param pollTimeoutMs timeout in milliseconds to poll data from Kafka. - * @param failOnDataLoss When `failOnDataLoss` is `true`, this method will either return record at - * offset if available, or throw exception.when `failOnDataLoss` is `false`, - * this method will either return record at offset if available, or return - * the next earliest available record less than untilOffset, or null. It - * will not throw any exception. + * @throws OffsetOutOfRangeException if `offset` is out of range. + * @throws TimeoutException if the consumer position is not changed after polling. It means the + * consumer polls nothing before timeout. */ - def get( - offset: Long, - untilOffset: Long, - pollTimeoutMs: Long, - failOnDataLoss: Boolean): ConsumerRecord[Array[Byte], Array[Byte]] = { - internalConsumer.get(offset, untilOffset, pollTimeoutMs, failOnDataLoss) + def fetch(offset: Long, pollTimeoutMs: Long): + (ju.List[ConsumerRecord[Array[Byte], Array[Byte]]], Long) = { + + // Seek to the offset because we may call seekToBeginning or seekToEnd before this. + seek(offset) + val p = consumer.poll(pollTimeoutMs) + val r = p.records(topicPartition) + logDebug(s"Polled $groupId ${p.partitions()} ${r.size}") + val offsetAfterPoll = consumer.position(topicPartition) + logDebug(s"Offset changed from $offset to $offsetAfterPoll after polling") + val fetchedData = (r, offsetAfterPoll) + if (r.isEmpty) { + // We cannot fetch anything after `poll`. Two possible cases: + // - `offset` is out of range so that Kafka returns nothing. `OffsetOutOfRangeException` will + // be thrown. + // - Cannot fetch any data before timeout. `TimeoutException` will be thrown. + // - Fetched something but all of them are not invisible. This is a valid case and let the + // caller handles this. 
+ val range = getAvailableOffsetRange() + if (offset < range.earliest || offset >= range.latest) { + throw new OffsetOutOfRangeException( + Map(topicPartition -> java.lang.Long.valueOf(offset)).asJava) + } else if (offset == offsetAfterPoll) { + throw new TimeoutException( + s"Cannot fetch record for offset $offset in $pollTimeoutMs milliseconds") + } + } + fetchedData } /** * Return the available offset range of the current partition. It's a pair of the earliest offset * and the latest offset. */ - def getAvailableOffsetRange(): AvailableOffsetRange = internalConsumer.getAvailableOffsetRange() + def getAvailableOffsetRange(): AvailableOffsetRange = { + consumer.seekToBeginning(Set(topicPartition).asJava) + val earliestOffset = consumer.position(topicPartition) + consumer.seekToEnd(Set(topicPartition).asJava) + val latestOffset = consumer.position(topicPartition) + AvailableOffsetRange(earliestOffset, latestOffset) + } - /** - * Release this consumer from being further used. Depending on its implementation, - * this consumer will be either finalized, or reset for reuse later. - */ - def release(): Unit + override def close(): Unit = { + consumer.close() + } - /** Reference to the internal implementation that this wrapper delegates to */ - def internalConsumer: InternalKafkaConsumer -} + /** Create a KafkaConsumer to fetch records for `topicPartition` */ + private def createConsumer: KafkaConsumer[Array[Byte], Array[Byte]] = { + val updatedKafkaParams = KafkaConfigUpdater("executor", kafkaParams.asScala.toMap) + .setAuthenticationConfigIfNeeded() + .build() + val c = new KafkaConsumer[Array[Byte], Array[Byte]](updatedKafkaParams) + val tps = new ju.ArrayList[TopicPartition]() + tps.add(topicPartition) + c.assign(tps) + c + } + private def seek(offset: Long): Unit = { + logDebug(s"Seeking to $groupId $topicPartition $offset") + consumer.seek(topicPartition, offset) + } +} /** - * A wrapper around Kafka's KafkaConsumer that throws error when data loss is detected. - * This is not for direct use outside this file. + * The internal object to store the fetched data from Kafka consumer and the next offset to poll. + * + * @param _records the pre-fetched Kafka records. + * @param _nextOffsetInFetchedData the next offset in `records`. We use this to verify if we + * should check if the pre-fetched data is still valid. + * @param _offsetAfterPoll the Kafka offset after calling `poll`. We will use this offset to + * poll when `records` is drained. */ -private[kafka010] case class InternalKafkaConsumer( - topicPartition: TopicPartition, - kafkaParams: ju.Map[String, Object]) extends Logging { - import InternalKafkaConsumer._ - - /** - * The internal object to store the fetched data from Kafka consumer and the next offset to poll. - * - * @param _records the pre-fetched Kafka records. - * @param _nextOffsetInFetchedData the next offset in `records`. We use this to verify if we - * should check if the pre-fetched data is still valid. - * @param _offsetAfterPoll the Kafka offset after calling `poll`. We will use this offset to - * poll when `records` is drained. 
- */ - private case class FetchedData( - private var _records: ju.ListIterator[ConsumerRecord[Array[Byte], Array[Byte]]], - private var _nextOffsetInFetchedData: Long, - private var _offsetAfterPoll: Long) { - - def withNewPoll( - records: ju.ListIterator[ConsumerRecord[Array[Byte], Array[Byte]]], - offsetAfterPoll: Long): FetchedData = { - this._records = records - this._nextOffsetInFetchedData = UNKNOWN_OFFSET - this._offsetAfterPoll = offsetAfterPoll - this - } - - /** Whether there are more elements */ - def hasNext: Boolean = _records.hasNext - - /** Move `records` forward and return the next record. */ - def next(): ConsumerRecord[Array[Byte], Array[Byte]] = { - val record = _records.next() - _nextOffsetInFetchedData = record.offset + 1 - record - } +private[kafka010] case class FetchedData( + private var _records: ju.ListIterator[ConsumerRecord[Array[Byte], Array[Byte]]], + private var _nextOffsetInFetchedData: Long, + private var _offsetAfterPoll: Long) { + + def withNewPoll( + records: ju.ListIterator[ConsumerRecord[Array[Byte], Array[Byte]]], + offsetAfterPoll: Long): FetchedData = { + this._records = records + this._nextOffsetInFetchedData = UNKNOWN_OFFSET + this._offsetAfterPoll = offsetAfterPoll + this + } - /** Move `records` backward and return the previous record. */ - def previous(): ConsumerRecord[Array[Byte], Array[Byte]] = { - assert(_records.hasPrevious, "fetchedData cannot move back") - val record = _records.previous() - _nextOffsetInFetchedData = record.offset - record - } + /** Whether there are more elements */ + def hasNext: Boolean = _records.hasNext - /** Reset the internal pre-fetched data. */ - def reset(): Unit = { - _records = ju.Collections.emptyListIterator() - _nextOffsetInFetchedData = UNKNOWN_OFFSET - _offsetAfterPoll = UNKNOWN_OFFSET - } + /** Move `records` forward and return the next record. */ + def next(): ConsumerRecord[Array[Byte], Array[Byte]] = { + val record = _records.next() + _nextOffsetInFetchedData = record.offset + 1 + record + } - /** - * Returns the next offset in `records`. We use this to verify if we should check if the - * pre-fetched data is still valid. - */ - def nextOffsetInFetchedData: Long = _nextOffsetInFetchedData + /** Move `records` backward and return the previous record. */ + def previous(): ConsumerRecord[Array[Byte], Array[Byte]] = { + assert(_records.hasPrevious, "fetchedData cannot move back") + val record = _records.previous() + _nextOffsetInFetchedData = record.offset + record + } - /** - * Returns the next offset to poll after draining the pre-fetched records. - */ - def offsetAfterPoll: Long = _offsetAfterPoll + /** Reset the internal pre-fetched data. */ + def reset(): Unit = { + _records = ju.Collections.emptyListIterator() + _nextOffsetInFetchedData = UNKNOWN_OFFSET + _offsetAfterPoll = UNKNOWN_OFFSET } /** - * The internal object returned by the `fetchRecord` method. If `record` is empty, it means it is - * invisible (either a transaction message, or an aborted message when the consumer's - * `isolation.level` is `read_committed`), and the caller should use `nextOffsetToFetch` to fetch - * instead. + * Returns the next offset in `records`. We use this to verify if we should check if the + * pre-fetched data is still valid. 
*/ - private case class FetchedRecord( - var record: ConsumerRecord[Array[Byte], Array[Byte]], - var nextOffsetToFetch: Long) { - - def withRecord( - record: ConsumerRecord[Array[Byte], Array[Byte]], - nextOffsetToFetch: Long): FetchedRecord = { - this.record = record - this.nextOffsetToFetch = nextOffsetToFetch - this - } - } + def nextOffsetInFetchedData: Long = _nextOffsetInFetchedData - private val groupId = kafkaParams.get(ConsumerConfig.GROUP_ID_CONFIG).asInstanceOf[String] + /** + * Returns the next offset to poll after draining the pre-fetched records. + */ + def offsetAfterPoll: Long = _offsetAfterPoll +} - @volatile private var consumer = createConsumer +/** + * The internal object returned by the `fetchRecord` method. If `record` is empty, it means it is + * invisible (either a transaction message, or an aborted message when the consumer's + * `isolation.level` is `read_committed`), and the caller should use `nextOffsetToFetch` to fetch + * instead. + */ +private[kafka010] case class FetchedRecord( + var record: ConsumerRecord[Array[Byte], Array[Byte]], + var nextOffsetToFetch: Long) { + + def withRecord( + record: ConsumerRecord[Array[Byte], Array[Byte]], + nextOffsetToFetch: Long): FetchedRecord = { + this.record = record + this.nextOffsetToFetch = nextOffsetToFetch + this + } +} - /** indicates whether this consumer is in use or not */ - @volatile var inUse = true +/** + * This class helps caller to read from Kafka leveraging consumer pool as well as fetched data pool. + * This class throws error when data loss is detected while reading from Kafka. + * + * NOTE for contributors: we need to ensure all the public methods to initialize necessary resources + * via calling `getOrRetrieveConsumer` and `getOrRetrieveFetchedData`. + */ +private[kafka010] class KafkaDataConsumer( + topicPartition: TopicPartition, + kafkaParams: ju.Map[String, Object], + consumerPool: InternalKafkaConsumerPool, + fetchedDataPool: FetchedDataPool) extends Logging { + import KafkaDataConsumer._ - /** indicate whether this consumer is going to be stopped in the next release */ - @volatile var markedForClose = false + @volatile private[kafka010] var _consumer: Option[InternalKafkaConsumer] = None + @volatile private var _fetchedData: Option[FetchedData] = None - /** - * The fetched data returned from Kafka consumer. This is a reusable private object to avoid - * memory allocation. - */ - private val fetchedData = FetchedData( - ju.Collections.emptyListIterator[ConsumerRecord[Array[Byte], Array[Byte]]], - UNKNOWN_OFFSET, - UNKNOWN_OFFSET) + private val groupId = kafkaParams.get(ConsumerConfig.GROUP_ID_CONFIG).asInstanceOf[String] + private val cacheKey = CacheKey(groupId, topicPartition) /** * The fetched record returned from the `fetchRecord` method. 
This is a reusable private object to @@ -195,41 +227,30 @@ private[kafka010] case class InternalKafkaConsumer( */ private val fetchedRecord: FetchedRecord = FetchedRecord(null, UNKNOWN_OFFSET) - - /** Create a KafkaConsumer to fetch records for `topicPartition` */ - private def createConsumer: KafkaConsumer[Array[Byte], Array[Byte]] = { - val updatedKafkaParams = KafkaConfigUpdater("executor", kafkaParams.asScala.toMap) - .setAuthenticationConfigIfNeeded() - .build() - val c = new KafkaConsumer[Array[Byte], Array[Byte]](updatedKafkaParams) - val tps = new ju.ArrayList[TopicPartition]() - tps.add(topicPartition) - c.assign(tps) - c - } - - private def runUninterruptiblyIfPossible[T](body: => T): T = Thread.currentThread match { - case ut: UninterruptibleThread => - ut.runUninterruptibly(body) - case _ => - logWarning("CachedKafkaConsumer is not running in UninterruptibleThread. " + - "It may hang when CachedKafkaConsumer's methods are interrupted because of KAFKA-1894") - body - } - /** - * Return the available offset range of the current partition. It's a pair of the earliest offset - * and the latest offset. + * Get the record for the given offset if available. + * + * If the record is invisible (either a + * transaction message, or an aborted message when the consumer's `isolation.level` is + * `read_committed`), it will be skipped and this method will try to fetch next available record + * within [offset, untilOffset). + * + * This method also will try its best to detect data loss. If `failOnDataLoss` is `true`, it will + * throw an exception when we detect an unavailable offset. If `failOnDataLoss` is `false`, this + * method will try to fetch next available record within [offset, untilOffset). + * + * When this method tries to skip offsets due to either invisible messages or data loss and + * reaches `untilOffset`, it will return `null`. + * + * @param offset the offset to fetch. + * @param untilOffset the max offset to fetch. Exclusive. + * @param pollTimeoutMs timeout in milliseconds to poll data from Kafka. + * @param failOnDataLoss When `failOnDataLoss` is `true`, this method will either return record at + * offset if available, or throw exception.when `failOnDataLoss` is `false`, + * this method will either return record at offset if available, or return + * the next earliest available record less than untilOffset, or null. It + * will not throw any exception. */ - def getAvailableOffsetRange(): AvailableOffsetRange = runUninterruptiblyIfPossible { - consumer.seekToBeginning(Set(topicPartition).asJava) - val earliestOffset = consumer.position(topicPartition) - consumer.seekToEnd(Set(topicPartition).asJava) - val latestOffset = consumer.position(topicPartition) - AvailableOffsetRange(earliestOffset, latestOffset) - } - - /** @see [[KafkaDataConsumer.get]] */ def get( offset: Long, untilOffset: Long, @@ -238,8 +259,13 @@ private[kafka010] case class InternalKafkaConsumer( ConsumerRecord[Array[Byte], Array[Byte]] = runUninterruptiblyIfPossible { require(offset < untilOffset, s"offset must always be less than untilOffset [offset: $offset, untilOffset: $untilOffset]") + + val consumer = getOrRetrieveConsumer() + val fetchedData = getOrRetrieveFetchedData(offset) + logDebug(s"Get $groupId $topicPartition nextOffset ${fetchedData.nextOffsetInFetchedData} " + - s"requested $offset") + "requested $offset") + // The following loop is basically for `failOnDataLoss = false`. When `failOnDataLoss` is // `false`, first, we will try to fetch the record at `offset`. 
If no such record exists, then // we will move to the next available offset within `[offset, untilOffset)` and retry. @@ -252,7 +278,8 @@ private[kafka010] case class InternalKafkaConsumer( while (toFetchOffset != UNKNOWN_OFFSET && !isFetchComplete) { try { - fetchedRecord = fetchRecord(toFetchOffset, untilOffset, pollTimeoutMs, failOnDataLoss) + fetchedRecord = fetchRecord(consumer, fetchedData, toFetchOffset, untilOffset, + pollTimeoutMs, failOnDataLoss) if (fetchedRecord.record != null) { isFetchComplete = true } else { @@ -266,12 +293,9 @@ private[kafka010] case class InternalKafkaConsumer( } } catch { case e: OffsetOutOfRangeException => - // When there is some error thrown, it's better to use a new consumer to drop all cached - // states in the old consumer. We don't need to worry about the performance because this - // is not a common path. - resetConsumer() - reportDataLoss(failOnDataLoss, s"Cannot fetch offset $toFetchOffset", e) - toFetchOffset = getEarliestAvailableOffsetBetween(toFetchOffset, untilOffset) + reportDataLoss(topicPartition, groupId, failOnDataLoss, + s"Cannot fetch offset $toFetchOffset", e) + toFetchOffset = getEarliestAvailableOffsetBetween(consumer, toFetchOffset, untilOffset) } } @@ -283,14 +307,45 @@ private[kafka010] case class InternalKafkaConsumer( } } + /** + * Return the available offset range of the current partition. It's a pair of the earliest offset + * and the latest offset. + */ + def getAvailableOffsetRange(): AvailableOffsetRange = runUninterruptiblyIfPossible { + val consumer = getOrRetrieveConsumer() + consumer.getAvailableOffsetRange() + } + + /** + * Release borrowed objects in data reader to the pool. Once the instance is created, caller + * must call method after using the instance to make sure resources are not leaked. + */ + def release(): Unit = { + if (_consumer.isDefined) { + consumerPool.returnObject(_consumer.get) + _consumer = None + } + + if (_fetchedData.isDefined) { + fetchedDataPool.release(cacheKey, _fetchedData.get) + _fetchedData = None + } + } + /** * Return the next earliest available offset in [offset, untilOffset). If all offsets in * [offset, untilOffset) are invalid (e.g., the topic is deleted and recreated), it will return * `UNKNOWN_OFFSET`. */ - private def getEarliestAvailableOffsetBetween(offset: Long, untilOffset: Long): Long = { - val range = getAvailableOffsetRange() + private def getEarliestAvailableOffsetBetween( + consumer: InternalKafkaConsumer, + offset: Long, + untilOffset: Long): Long = { + val range = consumer.getAvailableOffsetRange() logWarning(s"Some data may be lost. Recovering from the earliest offset: ${range.earliest}") + + val topicPartition = consumer.topicPartition + val groupId = consumer.groupId if (offset >= range.latest || range.earliest >= untilOffset) { // [offset, untilOffset) and [earliestOffset, latestOffset) have no overlap, // either @@ -305,10 +360,10 @@ private[kafka010] case class InternalKafkaConsumer( // | | | | // offset untilOffset earliestOffset latestOffset val warningMessage = - s""" - |The current available offset range is $range. - | Offset ${offset} is out of range, and records in [$offset, $untilOffset) will be - | skipped ${additionalMessage(failOnDataLoss = false)} + s""" + |The current available offset range is $range. 
+ | Offset $offset is out of range, and records in [$offset, $untilOffset) will be + | skipped ${additionalMessage(topicPartition, groupId, failOnDataLoss = false)} """.stripMargin logWarning(warningMessage) UNKNOWN_OFFSET @@ -321,8 +376,8 @@ private[kafka010] case class InternalKafkaConsumer( // This will happen when a topic is deleted and recreated, and new data are pushed very fast, // then we will see `offset` disappears first then appears again. Although the parameters // are same, the state in Kafka cluster is changed, so the outer loop won't be endless. - logWarning(s"Found a disappeared offset $offset. " + - s"Some data may be lost ${additionalMessage(failOnDataLoss = false)}") + logWarning(s"Found a disappeared offset $offset. Some data may be lost " + + s"${additionalMessage(topicPartition, groupId, failOnDataLoss = false)}") offset } else { // ------------------------------------------------------------------------------ @@ -330,10 +385,10 @@ private[kafka010] case class InternalKafkaConsumer( // | | | | // offset earliestOffset min(untilOffset,latestOffset) max(untilOffset, latestOffset) val warningMessage = - s""" - |The current available offset range is $range. - | Offset ${offset} is out of range, and records in [$offset, ${range.earliest}) will be - | skipped ${additionalMessage(failOnDataLoss = false)} + s""" + |The current available offset range is $range. + | Offset ${offset} is out of range, and records in [$offset, ${range.earliest}) will be + | skipped ${additionalMessage(topicPartition, groupId, failOnDataLoss = false)} """.stripMargin logWarning(warningMessage) range.earliest @@ -355,6 +410,8 @@ private[kafka010] case class InternalKafkaConsumer( * @throws TimeoutException if cannot fetch the record in `pollTimeoutMs` milliseconds. */ private def fetchRecord( + consumer: InternalKafkaConsumer, + fetchedData: FetchedData, offset: Long, untilOffset: Long, pollTimeoutMs: Long, @@ -362,7 +419,7 @@ private[kafka010] case class InternalKafkaConsumer( if (offset != fetchedData.nextOffsetInFetchedData) { // This is the first fetch, or the fetched data has been reset. // Fetch records from Kafka and update `fetchedData`. - fetchData(offset, pollTimeoutMs) + fetchData(consumer, fetchedData, offset, pollTimeoutMs) } else if (!fetchedData.hasNext) { // The last pre-fetched data has been drained. if (offset < fetchedData.offsetAfterPoll) { // Offsets in [offset, fetchedData.offsetAfterPoll) are invisible. Return a record to ask @@ -372,7 +429,7 @@ private[kafka010] case class InternalKafkaConsumer( return fetchedRecord.withRecord(null, nextOffsetToFetch) } else { // Fetch records from Kafka and update `fetchedData`. - fetchData(offset, pollTimeoutMs) + fetchData(consumer, fetchedData, offset, pollTimeoutMs) } } @@ -388,7 +445,7 @@ private[kafka010] case class InternalKafkaConsumer( // In general, Kafka uses the specified offset as the start point, and tries to fetch the next // available offset. Hence we need to handle offset mismatch. if (record.offset > offset) { - val range = getAvailableOffsetRange() + val range = consumer.getAvailableOffsetRange() if (range.earliest <= offset) { // `offset` is still valid but the corresponding message is invisible. We should skip it // and jump to `record.offset`. 
Here we move `fetchedData` back so that the next call of @@ -398,16 +455,19 @@ private[kafka010] case class InternalKafkaConsumer( } // This may happen when some records aged out but their offsets already got verified if (failOnDataLoss) { - reportDataLoss(true, s"Cannot fetch records in [$offset, ${record.offset})") + reportDataLoss(consumer.topicPartition, consumer.groupId, failOnDataLoss = true, + s"Cannot fetch records in [$offset, ${record.offset})") // Never happen as "reportDataLoss" will throw an exception throw new IllegalStateException( "reportDataLoss didn't throw an exception when 'failOnDataLoss' is true") } else if (record.offset >= untilOffset) { - reportDataLoss(false, s"Skip missing records in [$offset, $untilOffset)") + reportDataLoss(consumer.topicPartition, consumer.groupId, failOnDataLoss = false, + s"Skip missing records in [$offset, $untilOffset)") // Set `nextOffsetToFetch` to `untilOffset` to finish the current batch. fetchedRecord.withRecord(null, untilOffset) } else { - reportDataLoss(false, s"Skip missing records in [$offset, ${record.offset})") + reportDataLoss(consumer.topicPartition, consumer.groupId, failOnDataLoss = false, + s"Skip missing records in [$offset, ${record.offset})") fetchedRecord.withRecord(record, fetchedData.nextOffsetInFetchedData) } } else if (record.offset < offset) { @@ -421,17 +481,49 @@ private[kafka010] case class InternalKafkaConsumer( } } - /** Create a new consumer and reset cached states */ - private def resetConsumer(): Unit = { - consumer.close() - consumer = createConsumer - fetchedData.reset() + /** + * Poll messages from Kafka starting from `offset` and update `fetchedData`. `fetchedData` may be + * empty if the Kafka consumer fetches some messages but all of them are not visible messages + * (either transaction messages, or aborted messages when `isolation.level` is `read_committed`). + * + * @throws OffsetOutOfRangeException if `offset` is out of range. + * @throws TimeoutException if the consumer position is not changed after polling. It means the + * consumer polls nothing before timeout. + */ + private def fetchData( + consumer: InternalKafkaConsumer, + fetchedData: FetchedData, + offset: Long, + pollTimeoutMs: Long): Unit = { + val (records, offsetAfterPoll) = consumer.fetch(offset, pollTimeoutMs) + fetchedData.withNewPoll(records.listIterator, offsetAfterPoll) + } + + private def getOrRetrieveConsumer(): InternalKafkaConsumer = _consumer match { + case None => + _consumer = Option(consumerPool.borrowObject(cacheKey, kafkaParams)) + require(_consumer.isDefined, "borrowing consumer from pool must always succeed.") + _consumer.get + + case Some(consumer) => consumer + } + + private def getOrRetrieveFetchedData(offset: Long): FetchedData = _fetchedData match { + case None => + _fetchedData = Option(fetchedDataPool.acquire(cacheKey, offset)) + require(_fetchedData.isDefined, "acquiring fetched data from cache must always succeed.") + _fetchedData.get + + case Some(fetchedData) => fetchedData } /** * Return an addition message including useful message and instruction. */ - private def additionalMessage(failOnDataLoss: Boolean): String = { + private def additionalMessage( + topicPartition: TopicPartition, + groupId: String, + failOnDataLoss: Boolean): String = { if (failOnDataLoss) { s"(GroupId: $groupId, TopicPartition: $topicPartition). " + s"$INSTRUCTION_FOR_FAIL_ON_DATA_LOSS_TRUE" @@ -445,197 +537,69 @@ private[kafka010] case class InternalKafkaConsumer( * Throw an exception or log a warning as per `failOnDataLoss`. 
*/ private def reportDataLoss( + topicPartition: TopicPartition, + groupId: String, failOnDataLoss: Boolean, message: String, cause: Throwable = null): Unit = { - val finalMessage = s"$message ${additionalMessage(failOnDataLoss)}" + val finalMessage = s"$message ${additionalMessage(topicPartition, groupId, failOnDataLoss)}" reportDataLoss0(failOnDataLoss, finalMessage, cause) } - def close(): Unit = consumer.close() - - private def seek(offset: Long): Unit = { - logDebug(s"Seeking to $groupId $topicPartition $offset") - consumer.seek(topicPartition, offset) - } - - /** - * Poll messages from Kafka starting from `offset` and update `fetchedData`. `fetchedData` may be - * empty if the Kafka consumer fetches some messages but all of them are not visible messages - * (either transaction messages, or aborted messages when `isolation.level` is `read_committed`). - * - * @throws OffsetOutOfRangeException if `offset` is out of range. - * @throws TimeoutException if the consumer position is not changed after polling. It means the - * consumer polls nothing before timeout. - */ - private def fetchData(offset: Long, pollTimeoutMs: Long): Unit = { - // Seek to the offset because we may call seekToBeginning or seekToEnd before this. - seek(offset) - val p = consumer.poll(pollTimeoutMs) - val r = p.records(topicPartition) - logDebug(s"Polled $groupId ${p.partitions()} ${r.size}") - val offsetAfterPoll = consumer.position(topicPartition) - logDebug(s"Offset changed from $offset to $offsetAfterPoll after polling") - fetchedData.withNewPoll(r.listIterator, offsetAfterPoll) - if (!fetchedData.hasNext) { - // We cannot fetch anything after `poll`. Two possible cases: - // - `offset` is out of range so that Kafka returns nothing. `OffsetOutOfRangeException` will - // be thrown. - // - Cannot fetch any data before timeout. `TimeoutException` will be thrown. - // - Fetched something but all of them are not invisible. This is a valid case and let the - // caller handles this. - val range = getAvailableOffsetRange() - if (offset < range.earliest || offset >= range.latest) { - throw new OffsetOutOfRangeException( - Map(topicPartition -> java.lang.Long.valueOf(offset)).asJava) - } else if (offset == offsetAfterPoll) { - throw new TimeoutException( - s"Cannot fetch record for offset $offset in $pollTimeoutMs milliseconds") - } - } + private def runUninterruptiblyIfPossible[T](body: => T): T = Thread.currentThread match { + case ut: UninterruptibleThread => + ut.runUninterruptibly(body) + case _ => + logWarning("KafkaDataConsumer is not running in UninterruptibleThread. 
" + + "It may hang when KafkaDataConsumer's methods are interrupted because of KAFKA-1894") + body } } - private[kafka010] object KafkaDataConsumer extends Logging { + val UNKNOWN_OFFSET = -2L case class AvailableOffsetRange(earliest: Long, latest: Long) - private case class CachedKafkaDataConsumer(internalConsumer: InternalKafkaConsumer) - extends KafkaDataConsumer { - assert(internalConsumer.inUse) // make sure this has been set to true - override def release(): Unit = { KafkaDataConsumer.release(internalConsumer) } - } - - private case class NonCachedKafkaDataConsumer(internalConsumer: InternalKafkaConsumer) - extends KafkaDataConsumer { - override def release(): Unit = { internalConsumer.close() } - } - - private[kafka010] case class CacheKey(groupId: String, topicPartition: TopicPartition) { + case class CacheKey(groupId: String, topicPartition: TopicPartition) { def this(topicPartition: TopicPartition, kafkaParams: ju.Map[String, Object]) = this(kafkaParams.get(ConsumerConfig.GROUP_ID_CONFIG).asInstanceOf[String], topicPartition) } - // This cache has the following important properties. - // - We make a best-effort attempt to maintain the max size of the cache as configured capacity. - // The capacity is not guaranteed to be maintained, especially when there are more active - // tasks simultaneously using consumers than the capacity. - private[kafka010] lazy val cache = { - val conf = SparkEnv.get.conf - val capacity = conf.get(CONSUMER_CACHE_CAPACITY) - new ju.LinkedHashMap[CacheKey, InternalKafkaConsumer](capacity, 0.75f, true) { - override def removeEldestEntry( - entry: ju.Map.Entry[CacheKey, InternalKafkaConsumer]): Boolean = { - - // Try to remove the least-used entry if its currently not in use. - // - // If you cannot remove it, then the cache will keep growing. In the worst case, - // the cache will grow to the max number of concurrent tasks that can run in the executor, - // (that is, number of tasks slots) after which it will never reduce. This is unlikely to - // be a serious problem because an executor with more than 64 (default) tasks slots is - // likely running on a beefy machine that can handle a large number of simultaneously - // active consumers. - - if (!entry.getValue.inUse && this.size > capacity) { - logWarning( - s"KafkaConsumer cache hitting max capacity of $capacity, " + - s"removing consumer for ${entry.getKey}") - try { - entry.getValue.close() - } catch { - case e: SparkException => - logError(s"Error closing earliest Kafka consumer for ${entry.getKey}", e) - } - true - } else { - false - } - } + private val consumerPool = InternalKafkaConsumerPool.build + private val fetchedDataPool = FetchedDataPool.build + + ShutdownHookManager.addShutdownHook { () => + try { + fetchedDataPool.shutdown() + consumerPool.close() + } catch { + case e: Throwable => + logWarning("Ignoring Exception while shutting down pools from shutdown hook", e) } } /** - * Get a cached consumer for groupId, assigned to topic and partition. + * Get a data reader for groupId, assigned to topic and partition. * If matching consumer doesn't already exist, will be created using kafkaParams. - * The returned consumer must be released explicitly using [[KafkaDataConsumer.release()]]. - * - * Note: This method guarantees that the consumer returned is not currently in use by any one - * else. Within this guarantee, this method will make a best effort attempt to re-use consumers by - * caching them and tracking when they are in use. + * The returned data reader must be released explicitly. 
*/ def acquire( topicPartition: TopicPartition, - kafkaParams: ju.Map[String, Object], - useCache: Boolean): KafkaDataConsumer = synchronized { - val key = new CacheKey(topicPartition, kafkaParams) - val existingInternalConsumer = cache.get(key) - - lazy val newInternalConsumer = new InternalKafkaConsumer(topicPartition, kafkaParams) - + kafkaParams: ju.Map[String, Object]): KafkaDataConsumer = { if (TaskContext.get != null && TaskContext.get.attemptNumber >= 1) { - // If this is reattempt at running the task, then invalidate cached consumer if any and - // start with a new one. - if (existingInternalConsumer != null) { - // Consumer exists in cache. If its in use, mark it for closing later, or close it now. - if (existingInternalConsumer.inUse) { - existingInternalConsumer.markedForClose = true - } else { - existingInternalConsumer.close() - } - } - cache.remove(key) // Invalidate the cache in any case - NonCachedKafkaDataConsumer(newInternalConsumer) - - } else if (!useCache) { - // If planner asks to not reuse consumers, then do not use it, return a new consumer - NonCachedKafkaDataConsumer(newInternalConsumer) + val cacheKey = new CacheKey(topicPartition, kafkaParams) - } else if (existingInternalConsumer == null) { - // If consumer is not already cached, then put a new in the cache and return it - cache.put(key, newInternalConsumer) - newInternalConsumer.inUse = true - CachedKafkaDataConsumer(newInternalConsumer) + // If this is reattempt at running the task, then invalidate cached consumer if any. + consumerPool.invalidateKey(cacheKey) - } else if (existingInternalConsumer.inUse) { - // If consumer is already cached but is currently in use, then return a new consumer - NonCachedKafkaDataConsumer(newInternalConsumer) - - } else { - // If consumer is already cached and is currently not in use, then return that consumer - existingInternalConsumer.inUse = true - CachedKafkaDataConsumer(existingInternalConsumer) + // invalidate all fetched data for the key as well + // sadly we can't pinpoint specific data and invalidate cause we don't have unique id + fetchedDataPool.invalidate(cacheKey) } - } - private def release(intConsumer: InternalKafkaConsumer): Unit = { - synchronized { - - // Clear the consumer from the cache if this is indeed the consumer present in the cache - val key = new CacheKey(intConsumer.topicPartition, intConsumer.kafkaParams) - val cachedIntConsumer = cache.get(key) - if (intConsumer.eq(cachedIntConsumer)) { - // The released consumer is the same object as the cached one. - if (intConsumer.markedForClose) { - intConsumer.close() - cache.remove(key) - } else { - intConsumer.inUse = false - } - } else { - // The released consumer is either not the same one as in the cache, or not in the cache - // at all. This may happen if the cache was invalidate while this consumer was being used. - // Just close this consumer. 
- intConsumer.close() - logInfo(s"Released a supposedly cached consumer that was not found in the cache") - } - } + new KafkaDataConsumer(topicPartition, kafkaParams, consumerPool, fetchedDataPool) } -} - -private[kafka010] object InternalKafkaConsumer extends Logging { - - private val UNKNOWN_OFFSET = -2L private def reportDataLoss0( failOnDataLoss: Boolean, @@ -655,4 +619,5 @@ private[kafka010] object InternalKafkaConsumer extends Logging { } } } + } diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaMicroBatchStream.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaMicroBatchStream.scala index 08a52ddbd19b..9cd16c8e1624 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaMicroBatchStream.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaMicroBatchStream.scala @@ -144,14 +144,9 @@ private[kafka010] class KafkaMicroBatchStream( untilOffsets = untilOffsets, executorLocations = getSortedExecutorList()) - // Reuse Kafka consumers only when all the offset ranges have distinct TopicPartitions, - // that is, concurrent tasks will not read the same TopicPartitions. - val reuseKafkaConsumer = offsetRanges.map(_.topicPartition).toSet.size == offsetRanges.size - // Generate factories based on the offset ranges offsetRanges.map { range => - KafkaBatchInputPartition( - range, executorKafkaParams, pollTimeoutMs, failOnDataLoss, reuseKafkaConsumer) + KafkaBatchInputPartition(range, executorKafkaParams, pollTimeoutMs, failOnDataLoss) }.toArray } diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaRelation.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaRelation.scala index dd584a5987a0..dc7087821b10 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaRelation.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaRelation.scala @@ -102,7 +102,7 @@ private[kafka010] class KafkaRelation( KafkaSourceProvider.kafkaParamsForExecutors(specifiedKafkaParams, uniqueGroupId) val rdd = new KafkaSourceRDD( sqlContext.sparkContext, executorKafkaParams, offsetRanges, - pollTimeoutMs, failOnDataLoss, reuseKafkaConsumer = false).map { cr => + pollTimeoutMs, failOnDataLoss).map { cr => InternalRow( cr.key, cr.value, diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaSource.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaSource.scala index f477c35dcf39..d1a35ec53bc9 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaSource.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaSource.scala @@ -268,8 +268,7 @@ private[kafka010] class KafkaSource( // Create an RDD that reads from Kafka and get the (key, value) pair as byte arrays. 
val rdd = new KafkaSourceRDD( - sc, executorKafkaParams, offsetRanges, pollTimeoutMs, failOnDataLoss, - reuseKafkaConsumer = true).map { cr => + sc, executorKafkaParams, offsetRanges, pollTimeoutMs, failOnDataLoss).map { cr => InternalRow( cr.key, cr.value, diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaSourceRDD.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaSourceRDD.scala index f8b90056d293..dae9515205f5 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaSourceRDD.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaSourceRDD.scala @@ -63,8 +63,7 @@ private[kafka010] class KafkaSourceRDD( executorKafkaParams: ju.Map[String, Object], offsetRanges: Seq[KafkaSourceRDDOffsetRange], pollTimeoutMs: Long, - failOnDataLoss: Boolean, - reuseKafkaConsumer: Boolean) + failOnDataLoss: Boolean) extends RDD[ConsumerRecord[Array[Byte], Array[Byte]]](sc, Nil) { override def persist(newLevel: StorageLevel): this.type = { @@ -87,7 +86,7 @@ private[kafka010] class KafkaSourceRDD( context: TaskContext): Iterator[ConsumerRecord[Array[Byte], Array[Byte]]] = { val sourcePartition = thePart.asInstanceOf[KafkaSourceRDDPartition] val consumer = KafkaDataConsumer.acquire( - sourcePartition.offsetRange.topicPartition, executorKafkaParams, reuseKafkaConsumer) + sourcePartition.offsetRange.topicPartition, executorKafkaParams) val range = resolveRange(consumer, sourcePartition.offsetRange) assert( diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/package.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/package.scala index ff19862c20cc..b24c0f1aa143 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/package.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/package.scala @@ -38,4 +38,25 @@ package object kafka010 { // scalastyle:ignore " (check Structured Streaming Kafka integration guide for further details).") .intConf .createWithDefault(64) + + private[kafka010] val CONSUMER_CACHE_JMX_ENABLED = + ConfigBuilder("spark.kafka.consumer.cache.jmx.enable") + .doc("Enable or disable JMX for pools created with this configuration instance.") + .booleanConf + .createWithDefault(false) + + private[kafka010] val CONSUMER_CACHE_MIN_EVICTABLE_IDLE_TIME_MILLIS = + ConfigBuilder("spark.kafka.consumer.cache.minEvictableIdleTimeMillis") + .doc("The minimum amount of time an object may sit idle in the pool before " + + "it is eligible for eviction by the idle object evictor. " + + "When non-positive, no objects will be evicted from the pool due to idle time alone.") + .timeConf(TimeUnit.MILLISECONDS) + .createWithDefaultString("5m") + + private[kafka010] val CONSUMER_CACHE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS = + ConfigBuilder("spark.kafka.consumer.cache.evictorThreadRunIntervalMillis") + .doc("The number of milliseconds to sleep between runs of the idle object evictor thread. 
" + + "When non-positive, no idle object evictor thread will be run.") + .timeConf(TimeUnit.MILLISECONDS) + .createWithDefaultString("3m") } diff --git a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/FetchedDataPoolSuite.scala b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/FetchedDataPoolSuite.scala new file mode 100644 index 000000000000..ad3975d673f3 --- /dev/null +++ b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/FetchedDataPoolSuite.scala @@ -0,0 +1,337 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.spark.sql.kafka010 + +import java.{util => ju} + +import scala.collection.JavaConverters._ +import scala.collection.mutable + +import org.apache.kafka.clients.consumer.ConsumerRecord +import org.apache.kafka.common.TopicPartition +import org.scalatest.PrivateMethodTester + +import org.apache.spark.SparkEnv +import org.apache.spark.sql.kafka010.KafkaDataConsumer.CacheKey +import org.apache.spark.sql.test.SharedSparkSession + +class FetchedDataPoolSuite extends SharedSparkSession with PrivateMethodTester { + import FetchedDataPool._ + type Record = ConsumerRecord[Array[Byte], Array[Byte]] + + private val dummyBytes = "dummy".getBytes + + // Helper private method accessors for FetchedDataPool + private type PoolCacheType = mutable.Map[CacheKey, CachedFetchedDataList] + private val _cache = PrivateMethod[PoolCacheType]('cache) + + def getCache(pool: FetchedDataPool): PoolCacheType = { + pool.invokePrivate(_cache()) + } + + test("acquire fresh one") { + val dataPool = FetchedDataPool.build + + val cacheKey = CacheKey("testgroup", new TopicPartition("topic", 0)) + + assert(getCache(dataPool).get(cacheKey).isEmpty) + + val data = dataPool.acquire(cacheKey, 0) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 1, expectedNumTotal = 1) + assert(getCache(dataPool)(cacheKey).size === 1) + assert(getCache(dataPool)(cacheKey).head.inUse) + + data.withNewPoll(testRecords(0, 5).listIterator, 5) + + dataPool.release(cacheKey, data) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 1, expectedNumTotal = 1) + assert(getCache(dataPool)(cacheKey).size === 1) + assert(!getCache(dataPool)(cacheKey).head.inUse) + + dataPool.shutdown() + } + + test("acquire fetched data from multiple keys") { + val dataPool = FetchedDataPool.build + + val cacheKeys = (0 until 10).map { partId => + CacheKey("testgroup", new TopicPartition("topic", partId)) + } + + assert(getCache(dataPool).size === 0) + cacheKeys.foreach { key => assert(getCache(dataPool).get(key).isEmpty) } + + val dataList = cacheKeys.map(key => (key, dataPool.acquire(key, 0))) + + assert(getCache(dataPool).size === cacheKeys.size) + cacheKeys.map { key => + 
assert(getCache(dataPool)(key).size === 1) + assert(getCache(dataPool)(key).head.inUse) + } + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 10, expectedNumTotal = 10) + + dataList.map { case (_, data) => + data.withNewPoll(testRecords(0, 5).listIterator, 5) + } + + dataList.foreach { case (key, data) => + dataPool.release(key, data) + } + + assert(getCache(dataPool).size === cacheKeys.size) + cacheKeys.map { key => + assert(getCache(dataPool)(key).size === 1) + assert(!getCache(dataPool)(key).head.inUse) + } + + dataPool.shutdown() + } + + test("continuous use of fetched data from single key") { + val dataPool = FetchedDataPool.build + + val cacheKey = CacheKey("testgroup", new TopicPartition("topic", 0)) + + assert(getCache(dataPool).get(cacheKey).isEmpty) + + val data = dataPool.acquire(cacheKey, 0) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 1, expectedNumTotal = 1) + assert(getCache(dataPool)(cacheKey).size === 1) + assert(getCache(dataPool)(cacheKey).head.inUse) + + data.withNewPoll(testRecords(0, 5).listIterator, 5) + + (0 to 3).foreach { _ => data.next() } + + dataPool.release(cacheKey, data) + + // suppose next batch + + val data2 = dataPool.acquire(cacheKey, data.nextOffsetInFetchedData) + + assert(data.eq(data2)) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 1, expectedNumTotal = 1) + assert(getCache(dataPool)(cacheKey).size === 1) + assert(getCache(dataPool)(cacheKey).head.inUse) + + dataPool.release(cacheKey, data2) + + assert(getCache(dataPool)(cacheKey).size === 1) + assert(!getCache(dataPool)(cacheKey).head.inUse) + + dataPool.shutdown() + } + + test("multiple tasks referring same key continuously using fetched data") { + val dataPool = FetchedDataPool.build + + val cacheKey = CacheKey("testgroup", new TopicPartition("topic", 0)) + + assert(getCache(dataPool).get(cacheKey).isEmpty) + + val dataFromTask1 = dataPool.acquire(cacheKey, 0) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 1, expectedNumTotal = 1) + assert(getCache(dataPool)(cacheKey).size === 1) + assert(getCache(dataPool)(cacheKey).head.inUse) + + val dataFromTask2 = dataPool.acquire(cacheKey, 0) + + // it shouldn't give same object as dataFromTask1 though it asks same offset + // it definitely works when offsets are not overlapped: skip adding test for that + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 2, expectedNumTotal = 2) + assert(getCache(dataPool)(cacheKey).size === 2) + assert(getCache(dataPool)(cacheKey)(1).inUse) + + // reading from task 1 + dataFromTask1.withNewPoll(testRecords(0, 5).listIterator, 5) + + (0 to 3).foreach { _ => dataFromTask1.next() } + + dataPool.release(cacheKey, dataFromTask1) + + // reading from task 2 + dataFromTask2.withNewPoll(testRecords(0, 30).listIterator, 30) + + (0 to 5).foreach { _ => dataFromTask2.next() } + + dataPool.release(cacheKey, dataFromTask2) + + // suppose next batch for task 1 + val data2FromTask1 = dataPool.acquire(cacheKey, dataFromTask1.nextOffsetInFetchedData) + assert(data2FromTask1.eq(dataFromTask1)) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 2, expectedNumTotal = 2) + assert(getCache(dataPool)(cacheKey).head.inUse) + + // suppose next batch for task 2 + val data2FromTask2 = dataPool.acquire(cacheKey, dataFromTask2.nextOffsetInFetchedData) + assert(data2FromTask2.eq(dataFromTask2)) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 2, expectedNumTotal = 2) + assert(getCache(dataPool)(cacheKey)(1).inUse) + + // release from 
task 2 + dataPool.release(cacheKey, data2FromTask2) + assert(!getCache(dataPool)(cacheKey)(1).inUse) + + // release from task 1 + dataPool.release(cacheKey, data2FromTask1) + assert(!getCache(dataPool)(cacheKey).head.inUse) + + dataPool.shutdown() + } + + test("evict idle fetched data") { + import FetchedDataPool._ + import org.scalatest.time.SpanSugar._ + + val minEvictableIdleTimeMillis = 1000 + val evictorThreadRunIntervalMillis = 500 + + val newConf = Seq( + CONFIG_NAME_MIN_EVICTABLE_IDLE_TIME_MILLIS -> minEvictableIdleTimeMillis.toString, + CONFIG_NAME_EVICTOR_THREAD_RUN_INTERVAL_MILLIS -> evictorThreadRunIntervalMillis.toString) + + withSparkConf(newConf: _*) { + val dataPool = FetchedDataPool.build + + val cacheKeys = (0 until 10).map { partId => + CacheKey("testgroup", new TopicPartition("topic", partId)) + } + + val dataList = cacheKeys.map(key => (key, dataPool.acquire(key, 0))) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 10, expectedNumTotal = 10) + + dataList.map { case (_, data) => + data.withNewPoll(testRecords(0, 5).listIterator, 5) + } + + val dataToEvict = dataList.take(3) + dataToEvict.foreach { case (key, data) => + dataPool.release(key, data) + } + + // wait up to twice than minEvictableIdleTimeMillis to ensure evictor thread to clear up + // idle objects + eventually(timeout((minEvictableIdleTimeMillis.toLong * 2).milliseconds), + interval(evictorThreadRunIntervalMillis.milliseconds)) { + // idle objects should be evicted + dataToEvict.map { case (key, _) => + assert(getCache(dataPool)(key).isEmpty) + } + } + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 10, expectedNumTotal = 7) + assert(getCache(dataPool).values.map(_.size).sum === dataList.size - dataToEvict.size) + + dataList.takeRight(3).foreach { case (key, data) => + dataPool.release(key, data) + } + + // ensure releasing more objects don't trigger eviction immediately + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 10, expectedNumTotal = 7) + assert(getCache(dataPool).values.map(_.size).sum === dataList.size - dataToEvict.size) + + dataPool.shutdown() + } + } + + test("invalidate key") { + val dataPool = FetchedDataPool.build + + val cacheKey = CacheKey("testgroup", new TopicPartition("topic", 0)) + + val dataFromTask1 = dataPool.acquire(cacheKey, 0) + val dataFromTask2 = dataPool.acquire(cacheKey, 0) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 2, expectedNumTotal = 2) + + // 1 idle, 1 active + dataPool.release(cacheKey, dataFromTask1) + + val cacheKey2 = CacheKey("testgroup", new TopicPartition("topic", 1)) + + dataPool.acquire(cacheKey2, 0) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 3, expectedNumTotal = 3) + assert(getCache(dataPool).size === 2) + assert(getCache(dataPool)(cacheKey).size === 2) + assert(getCache(dataPool)(cacheKey2).size === 1) + + dataPool.invalidate(cacheKey) + + assertFetchedDataPoolStatistic(dataPool, expectedNumCreated = 3, expectedNumTotal = 1) + assert(getCache(dataPool).size === 1) + assert(getCache(dataPool).get(cacheKey).isEmpty) + + // it doesn't affect other keys + assert(getCache(dataPool)(cacheKey2).size === 1) + + dataPool.release(cacheKey, dataFromTask2) + + // it doesn't throw error on invalidated objects, but it doesn't cache them again + assert(getCache(dataPool).size === 1) + assert(getCache(dataPool).get(cacheKey).isEmpty) + + dataPool.shutdown() + } + + + private def testRecords(startOffset: Long, count: Int): ju.List[Record] = { + (0 until count).map { offset => + new 
Record("topic", 0, startOffset + offset, dummyBytes, dummyBytes) + }.toList.asJava + } + + private def withSparkConf(pairs: (String, String)*)(f: => Unit): Unit = { + val conf = SparkEnv.get.conf + + val (keys, values) = pairs.unzip + val currentValues = keys.map { key => + if (conf.contains(key)) { + Some(conf.get(key)) + } else { + None + } + } + + (keys, values).zipped.foreach { conf.set } + + try f finally { + keys.zip(currentValues).foreach { + case (key, Some(value)) => conf.set(key, value) + case (key, None) => conf.remove(key) + } + } + } + + private def assertFetchedDataPoolStatistic( + fetchedDataPool: FetchedDataPool, + expectedNumCreated: Long, + expectedNumTotal: Long): Unit = { + assert(fetchedDataPool.getNumCreated === expectedNumCreated) + assert(fetchedDataPool.getNumTotal === expectedNumTotal) + } +} diff --git a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPoolSuite.scala b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPoolSuite.scala new file mode 100644 index 000000000000..7aa13b7042e3 --- /dev/null +++ b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPoolSuite.scala @@ -0,0 +1,316 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.spark.sql.kafka010 + +import java.{util => ju} + +import scala.collection.JavaConverters._ + +import org.apache.kafka.clients.consumer.ConsumerConfig._ +import org.apache.kafka.common.TopicPartition +import org.apache.kafka.common.serialization.ByteArrayDeserializer + +import org.apache.spark.SparkEnv +import org.apache.spark.sql.kafka010.KafkaDataConsumer.CacheKey +import org.apache.spark.sql.test.SharedSparkSession + +class InternalKafkaConsumerPoolSuite extends SharedSparkSession { + + test("basic multiple borrows and returns for single key") { + val pool = InternalKafkaConsumerPool.build + + val topic = "topic" + val partitionId = 0 + val topicPartition = new TopicPartition(topic, partitionId) + + val kafkaParams: ju.Map[String, Object] = getTestKafkaParams + + val key = new CacheKey(topicPartition, kafkaParams) + + val pooledObjects = (0 to 2).map { _ => + val pooledObject = pool.borrowObject(key, kafkaParams) + assertPooledObject(pooledObject, topicPartition, kafkaParams) + pooledObject + } + + assertPoolStateForKey(pool, key, numIdle = 0, numActive = 3, numTotal = 3) + assertPoolState(pool, numIdle = 0, numActive = 3, numTotal = 3) + + val pooledObject2 = pool.borrowObject(key, kafkaParams) + + assertPooledObject(pooledObject2, topicPartition, kafkaParams) + assertPoolStateForKey(pool, key, numIdle = 0, numActive = 4, numTotal = 4) + assertPoolState(pool, numIdle = 0, numActive = 4, numTotal = 4) + + pooledObjects.foreach(pool.returnObject) + + assertPoolStateForKey(pool, key, numIdle = 3, numActive = 1, numTotal = 4) + assertPoolState(pool, numIdle = 3, numActive = 1, numTotal = 4) + + pool.returnObject(pooledObject2) + + // we only allow three idle objects per key + assertPoolStateForKey(pool, key, numIdle = 3, numActive = 0, numTotal = 3) + assertPoolState(pool, numIdle = 3, numActive = 0, numTotal = 3) + + pool.close() + } + + test("basic borrow and return for multiple keys") { + val pool = InternalKafkaConsumerPool.build + + val kafkaParams = getTestKafkaParams + val topicPartitions = createTopicPartitions(Seq("topic", "topic2"), 6) + val keys = createCacheKeys(topicPartitions, kafkaParams) + + // while in loop pool doesn't still exceed total pool size + val keyToPooledObjectPairs = borrowObjectsPerKey(pool, kafkaParams, keys) + + assertPoolState(pool, numIdle = 0, numActive = keyToPooledObjectPairs.length, + numTotal = keyToPooledObjectPairs.length) + + returnObjects(pool, keyToPooledObjectPairs) + + assertPoolState(pool, numIdle = keyToPooledObjectPairs.length, numActive = 0, + numTotal = keyToPooledObjectPairs.length) + + pool.close() + } + + test("borrow more than soft max capacity from pool which is neither free space nor idle object") { + testWithPoolBorrowedSoftMaxCapacity { (pool, kafkaParams, keyToPooledObjectPairs) => + val moreTopicPartition = new TopicPartition("topic2", 0) + val newCacheKey = new CacheKey(moreTopicPartition, kafkaParams) + + // exceeds soft max pool size, and also no idle object for cleaning up + // but pool will borrow a new object + pool.borrowObject(newCacheKey, kafkaParams) + + assertPoolState(pool, numIdle = 0, numActive = keyToPooledObjectPairs.length + 1, + numTotal = keyToPooledObjectPairs.length + 1) + } + } + + test("borrow more than soft max capacity from pool frees up idle objects automatically") { + testWithPoolBorrowedSoftMaxCapacity { (pool, kafkaParams, keyToPooledObjectPairs) => + // return 20% of objects to ensure there're some idle objects to free up later + val numToReturn = 
(keyToPooledObjectPairs.length * 0.2).toInt + returnObjects(pool, keyToPooledObjectPairs.take(numToReturn)) + + assertPoolState(pool, numIdle = numToReturn, + numActive = keyToPooledObjectPairs.length - numToReturn, + numTotal = keyToPooledObjectPairs.length) + + // borrow a new object: there should be some idle objects to clean up + val moreTopicPartition = new TopicPartition("topic2", 0) + val newCacheKey = new CacheKey(moreTopicPartition, kafkaParams) + + val newObject = pool.borrowObject(newCacheKey, kafkaParams) + assertPooledObject(newObject, moreTopicPartition, kafkaParams) + assertPoolStateForKey(pool, newCacheKey, numIdle = 0, numActive = 1, numTotal = 1) + + // at least one of idle object should be freed up + assert(pool.getNumIdle < numToReturn) + // we can determine number of active objects correctly + assert(pool.getNumActive === keyToPooledObjectPairs.length - numToReturn + 1) + // total objects should be more than number of active + 1 but can't expect exact number + assert(pool.getTotal > keyToPooledObjectPairs.length - numToReturn + 1) + } + } + + + private def testWithPoolBorrowedSoftMaxCapacity( + testFn: (InternalKafkaConsumerPool, + ju.Map[String, Object], + Seq[(CacheKey, InternalKafkaConsumer)]) => Unit): Unit = { + val capacity = 16 + val newConf = newConfForKafkaPool(Some(capacity), Some(-1), Some(-1)) + + withSparkConf(newConf: _*) { + val pool = InternalKafkaConsumerPool.build + + try { + val kafkaParams = getTestKafkaParams + val topicPartitions = createTopicPartitions(Seq("topic"), capacity) + val keys = createCacheKeys(topicPartitions, kafkaParams) + + // borrow objects which makes pool reaching soft capacity + val keyToPooledObjectPairs = borrowObjectsPerKey(pool, kafkaParams, keys) + + testFn(pool, kafkaParams, keyToPooledObjectPairs) + } finally { + pool.close() + } + } + } + + test("evicting idle objects on background") { + import org.scalatest.time.SpanSugar._ + + val minEvictableIdleTimeMillis = 3 * 1000 // 3 seconds + val evictorThreadRunIntervalMillis = 500 // triggering multiple evictions by intention + + val newConf = newConfForKafkaPool(None, Some(minEvictableIdleTimeMillis), + Some(evictorThreadRunIntervalMillis)) + withSparkConf(newConf: _*) { + val pool = InternalKafkaConsumerPool.build + + val kafkaParams = getTestKafkaParams + val topicPartitions = createTopicPartitions(Seq("topic"), 10) + val keys = createCacheKeys(topicPartitions, kafkaParams) + + // borrow and return some consumers to ensure some partitions are being idle + // this test covers the use cases: rebalance / topic removal happens while running query + val keyToPooledObjectPairs = borrowObjectsPerKey(pool, kafkaParams, keys) + val objectsToReturn = keyToPooledObjectPairs.filter(_._1.topicPartition.partition() % 2 == 0) + returnObjects(pool, objectsToReturn) + + // wait up to twice than minEvictableIdleTimeMillis to ensure evictor thread to clear up + // idle objects + eventually(timeout((minEvictableIdleTimeMillis.toLong * 2).seconds), + interval(evictorThreadRunIntervalMillis.milliseconds)) { + assertPoolState(pool, numIdle = 0, numActive = 5, numTotal = 5) + } + + pool.close() + } + } + + private def newConfForKafkaPool( + capacity: Option[Int], + minEvictableIdleTimeMillis: Option[Long], + evictorThreadRunIntervalMillis: Option[Long]): Seq[(String, String)] = { + Seq( + CONSUMER_CACHE_CAPACITY.key -> capacity, + CONSUMER_CACHE_MIN_EVICTABLE_IDLE_TIME_MILLIS.key -> minEvictableIdleTimeMillis, + CONSUMER_CACHE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS.key -> 
evictorThreadRunIntervalMillis + ).filter(_._2.isDefined).map(e => (e._1 -> e._2.get.toString)) + } + + private def createTopicPartitions( + topicNames: Seq[String], + countPartition: Int): List[TopicPartition] = { + for ( + topic <- topicNames.toList; + partitionId <- 0 until countPartition + ) yield new TopicPartition(topic, partitionId) + } + + private def createCacheKeys( + topicPartitions: List[TopicPartition], + kafkaParams: ju.Map[String, Object]): List[CacheKey] = { + topicPartitions.map(new CacheKey(_, kafkaParams)) + } + + private def assertPooledObject( + pooledObject: InternalKafkaConsumer, + expectedTopicPartition: TopicPartition, + expectedKafkaParams: ju.Map[String, Object]): Unit = { + assert(pooledObject != null) + assert(pooledObject.kafkaParams === expectedKafkaParams) + assert(pooledObject.topicPartition === expectedTopicPartition) + } + + private def assertPoolState( + pool: InternalKafkaConsumerPool, + numIdle: Int, + numActive: Int, + numTotal: Int): Unit = { + assert(pool.getNumIdle === numIdle) + assert(pool.getNumActive === numActive) + assert(pool.getTotal === numTotal) + } + + private def assertPoolStateForKey( + pool: InternalKafkaConsumerPool, + key: CacheKey, + numIdle: Int, + numActive: Int, + numTotal: Int): Unit = { + assert(pool.getNumIdle(key) === numIdle) + assert(pool.getNumActive(key) === numActive) + assert(pool.getTotal(key) === numTotal) + } + + private def getTestKafkaParams: ju.Map[String, Object] = Map[String, Object]( + GROUP_ID_CONFIG -> "groupId", + BOOTSTRAP_SERVERS_CONFIG -> "PLAINTEXT://localhost:9092", + KEY_DESERIALIZER_CLASS_CONFIG -> classOf[ByteArrayDeserializer].getName, + VALUE_DESERIALIZER_CLASS_CONFIG -> classOf[ByteArrayDeserializer].getName, + AUTO_OFFSET_RESET_CONFIG -> "earliest", + ENABLE_AUTO_COMMIT_CONFIG -> "false" + ).asJava + + private def borrowObjectsPerKey( + pool: InternalKafkaConsumerPool, + kafkaParams: ju.Map[String, Object], + keys: List[CacheKey]): Seq[(CacheKey, InternalKafkaConsumer)] = { + keys.map { key => + val numActiveBeforeBorrowing = pool.getNumActive + val numIdleBeforeBorrowing = pool.getNumIdle + val numTotalBeforeBorrowing = pool.getTotal + + val pooledObj = pool.borrowObject(key, kafkaParams) + + assertPoolStateForKey(pool, key, numIdle = 0, numActive = 1, numTotal = 1) + assertPoolState(pool, numIdle = numIdleBeforeBorrowing, + numActive = numActiveBeforeBorrowing + 1, numTotal = numTotalBeforeBorrowing + 1) + + (key, pooledObj) + } + } + + private def returnObjects( + pool: InternalKafkaConsumerPool, + objects: Seq[(CacheKey, InternalKafkaConsumer)]): Unit = { + objects.foreach { case (key, pooledObj) => + val numActiveBeforeReturning = pool.getNumActive + val numIdleBeforeReturning = pool.getNumIdle + val numTotalBeforeReturning = pool.getTotal + + pool.returnObject(pooledObj) + + // we only allow one idle object per key + assertPoolStateForKey(pool, key, numIdle = 1, numActive = 0, numTotal = 1) + assertPoolState(pool, numIdle = numIdleBeforeReturning + 1, + numActive = numActiveBeforeReturning - 1, numTotal = numTotalBeforeReturning) + } + } + + private def withSparkConf(pairs: (String, String)*)(f: => Unit): Unit = { + val conf = SparkEnv.get.conf + + val (keys, values) = pairs.unzip + val currentValues = keys.map { key => + if (conf.contains(key)) { + Some(conf.get(key)) + } else { + None + } + } + + (keys, values).zipped.foreach { conf.set } + + try f finally { + keys.zip(currentValues).foreach { + case (key, Some(value)) => conf.set(key, value) + case (key, None) => conf.remove(key) + } + 
} + } +} diff --git a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaDataConsumerSuite.scala b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaDataConsumerSuite.scala index 8aa7e06e772a..3c89f5f7efd6 100644 --- a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaDataConsumerSuite.scala +++ b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaDataConsumerSuite.scala @@ -20,6 +20,7 @@ package org.apache.spark.sql.kafka010 import java.util.concurrent.{Executors, TimeUnit} import scala.collection.JavaConverters._ +import scala.collection.immutable import scala.util.Random import org.apache.kafka.clients.consumer.ConsumerConfig._ @@ -60,49 +61,83 @@ class KafkaDataConsumerSuite extends SharedSparkSession with PrivateMethodTester AUTO_OFFSET_RESET_CONFIG -> "earliest", ENABLE_AUTO_COMMIT_CONFIG -> "false" ).asJava + private var fetchedDataPool: FetchedDataPool = _ + private var consumerPool: InternalKafkaConsumerPool = _ + + override def beforeEach(): Unit = { + fetchedDataPool = { + val fetchedDataPoolMethod = PrivateMethod[FetchedDataPool]('fetchedDataPool) + KafkaDataConsumer.invokePrivate(fetchedDataPoolMethod()) + } + + consumerPool = { + val internalKafkaConsumerPoolMethod = PrivateMethod[InternalKafkaConsumerPool]('consumerPool) + KafkaDataConsumer.invokePrivate(internalKafkaConsumerPoolMethod()) + } + + fetchedDataPool.reset() + consumerPool.reset() + } test("SPARK-19886: Report error cause correctly in reportDataLoss") { val cause = new Exception("D'oh!") val reportDataLoss = PrivateMethod[Unit]('reportDataLoss0) val e = intercept[IllegalStateException] { - InternalKafkaConsumer.invokePrivate(reportDataLoss(true, "message", cause)) + KafkaDataConsumer.invokePrivate(reportDataLoss(true, "message", cause)) } assert(e.getCause === cause) } test("new KafkaDataConsumer instance in case of Task retry") { try { - KafkaDataConsumer.cache.clear() - val kafkaParams = getKafkaParams() val key = new CacheKey(groupId, topicPartition) val context1 = new TaskContextImpl(0, 0, 0, 0, 0, null, null, null) TaskContext.setTaskContext(context1) - val consumer1 = KafkaDataConsumer.acquire(topicPartition, kafkaParams, true) + val consumer1 = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + + // any method call which requires consumer is necessary + consumer1.getAvailableOffsetRange() + + val consumer1Underlying = consumer1._consumer + assert(consumer1Underlying.isDefined) + consumer1.release() - assert(KafkaDataConsumer.cache.size() == 1) - assert(KafkaDataConsumer.cache.get(key).eq(consumer1.internalConsumer)) + assert(consumerPool.getTotal(key) === 1) + val pooledObj = consumerPool.borrowObject(key, kafkaParams) + assert(consumer1Underlying.get.eq(pooledObj)) + consumerPool.returnObject(pooledObj) val context2 = new TaskContextImpl(0, 0, 0, 0, 1, null, null, null) TaskContext.setTaskContext(context2) - val consumer2 = KafkaDataConsumer.acquire(topicPartition, kafkaParams, true) + val consumer2 = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + + // any method call which requires consumer is necessary + consumer2.getAvailableOffsetRange() + + val consumer2Underlying = consumer2._consumer + assert(consumer2Underlying.isDefined) + // here we expect different consumer as pool will invalidate for task reattempt + assert(consumer2Underlying.get.ne(consumer1Underlying.get)) + consumer2.release() - // The first consumer should be removed from cache and new non-cached should be returned - 
assert(KafkaDataConsumer.cache.size() == 0) - assert(consumer1.internalConsumer.ne(consumer2.internalConsumer)) + // The first consumer should be removed from cache, but second consumer should be cached. + assert(consumerPool.getTotal(key) === 1) + val pooledObj2 = consumerPool.borrowObject(key, kafkaParams) + assert(consumer2Underlying.get.eq(pooledObj2)) + consumerPool.returnObject(pooledObj2) } finally { TaskContext.unset() } } test("SPARK-23623: concurrent use of KafkaDataConsumer") { - val data = (1 to 1000).map(_.toString) - testUtils.createTopic(topic, 1) - testUtils.sendMessages(topic, data.toArray) + val data: immutable.IndexedSeq[String] = prepareTestTopicHavingTestMessages(topic) + val topicPartition = new TopicPartition(topic, 0) val kafkaParams = getKafkaParams() val numThreads = 100 val numConsumerUsages = 500 @@ -110,14 +145,13 @@ class KafkaDataConsumerSuite extends SharedSparkSession with PrivateMethodTester @volatile var error: Throwable = null def consume(i: Int): Unit = { - val useCache = Random.nextBoolean val taskContext = if (Random.nextBoolean) { new TaskContextImpl(0, 0, 0, 0, attemptNumber = Random.nextInt(2), null, null, null) } else { null } TaskContext.setTaskContext(taskContext) - val consumer = KafkaDataConsumer.acquire(topicPartition, kafkaParams, useCache) + val consumer = KafkaDataConsumer.acquire(topicPartition, kafkaParams) try { val range = consumer.getAvailableOffsetRange() val rcvd = range.earliest until range.latest map { offset => @@ -147,4 +181,143 @@ class KafkaDataConsumerSuite extends SharedSparkSession with PrivateMethodTester threadpool.shutdown() } } + + test("SPARK-25151 Handles multiple tasks in executor fetching same (topic, partition) pair") { + prepareTestTopicHavingTestMessages(topic) + val topicPartition = new TopicPartition(topic, 0) + + val kafkaParams = getKafkaParams() + + withTaskContext(TaskContext.empty()) { + // task A trying to fetch offset 0 to 100, and read 5 records + val consumer1 = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + val lastOffsetForConsumer1 = readAndGetLastOffset(consumer1, 0, 100, 5) + consumer1.release() + + assertFetchedDataPoolStatistic(fetchedDataPool, expectedNumCreated = 1, expectedNumTotal = 1) + + // task B trying to fetch offset 300 to 500, and read 5 records + val consumer2 = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + val lastOffsetForConsumer2 = readAndGetLastOffset(consumer2, 300, 500, 5) + consumer2.release() + + assertFetchedDataPoolStatistic(fetchedDataPool, expectedNumCreated = 2, expectedNumTotal = 2) + + // task A continue reading from the last offset + 1, with upper bound 100 again + val consumer1a = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + + consumer1a.get(lastOffsetForConsumer1 + 1, 100, 10000, failOnDataLoss = false) + consumer1a.release() + + // pool should succeed to provide cached data instead of creating one + assertFetchedDataPoolStatistic(fetchedDataPool, expectedNumCreated = 2, expectedNumTotal = 2) + + // task B also continue reading from the last offset + 1, with upper bound 500 again + val consumer2a = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + + consumer2a.get(lastOffsetForConsumer2 + 1, 500, 10000, failOnDataLoss = false) + consumer2a.release() + + // same expectation: pool should succeed to provide cached data instead of creating one + assertFetchedDataPoolStatistic(fetchedDataPool, expectedNumCreated = 2, expectedNumTotal = 2) + } + } + + test("SPARK-25151 Handles multiple tasks in executor fetching same (topic, 
partition) pair " + + "and same offset (edge-case) - data in use") { + prepareTestTopicHavingTestMessages(topic) + val topicPartition = new TopicPartition(topic, 0) + + val kafkaParams = getKafkaParams() + + withTaskContext(TaskContext.empty()) { + // task A trying to fetch offset 0 to 100, and read 5 records (still reading) + val consumer1 = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + val lastOffsetForConsumer1 = readAndGetLastOffset(consumer1, 0, 100, 5) + + assertFetchedDataPoolStatistic(fetchedDataPool, expectedNumCreated = 1, expectedNumTotal = 1) + + // task B trying to fetch offset the last offset task A is reading so far + 1 to 500 + // this is a condition for edge case + val consumer2 = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + consumer2.get(lastOffsetForConsumer1 + 1, 100, 10000, failOnDataLoss = false) + + // Pool must create a new fetched data instead of returning existing on now in use even + // there's fetched data matching start offset. + assertFetchedDataPoolStatistic(fetchedDataPool, expectedNumCreated = 2, expectedNumTotal = 2) + + consumer1.release() + consumer2.release() + } + } + + test("SPARK-25151 Handles multiple tasks in executor fetching same (topic, partition) pair " + + "and same offset (edge-case) - data not in use") { + prepareTestTopicHavingTestMessages(topic) + val topicPartition = new TopicPartition(topic, 0) + + val kafkaParams = getKafkaParams() + + withTaskContext(TaskContext.empty()) { + // task A trying to fetch offset 0 to 100, and read 5 records (still reading) + val consumer1 = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + val lastOffsetForConsumer1 = readAndGetLastOffset(consumer1, 0, 100, 5) + consumer1.release() + + assertFetchedDataPoolStatistic(fetchedDataPool, expectedNumCreated = 1, expectedNumTotal = 1) + + // task B trying to fetch offset the last offset task A is reading so far + 1 to 500 + // this is a condition for edge case + val consumer2 = KafkaDataConsumer.acquire(topicPartition, kafkaParams) + consumer2.get(lastOffsetForConsumer1 + 1, 100, 10000, failOnDataLoss = false) + + // Pool cannot determine the origin task, so it has to just provide matching one. + // task A may come back and try to fetch, and cannot find previous data + // (or the data is in use). + // If then task A may have to fetch from Kafka, but we already avoided fetching from Kafka in + // task B, so it is not a big deal in overall. 
+ assertFetchedDataPoolStatistic(fetchedDataPool, expectedNumCreated = 1, expectedNumTotal = 1) + + consumer2.release() + } + } + + private def assertFetchedDataPoolStatistic( + fetchedDataPool: FetchedDataPool, + expectedNumCreated: Long, + expectedNumTotal: Long): Unit = { + assert(fetchedDataPool.getNumCreated === expectedNumCreated) + assert(fetchedDataPool.getNumTotal === expectedNumTotal) + } + + private def readAndGetLastOffset( + consumer: KafkaDataConsumer, + startOffset: Long, + untilOffset: Long, + numToRead: Int): Long = { + var lastOffset: Long = startOffset - 1 + (0 until numToRead).foreach { _ => + val record = consumer.get(lastOffset + 1, untilOffset, 10000, failOnDataLoss = false) + // validation for fetched record is covered by other tests, so skip on validating + lastOffset = record.offset() + } + lastOffset + } + + private def prepareTestTopicHavingTestMessages(topic: String) = { + val data = (1 to 1000).map(_.toString) + testUtils.createTopic(topic, 1) + testUtils.sendMessages(topic, data.toArray) + data + } + + private def withTaskContext(context: TaskContext)(task: => Unit): Unit = { + try { + TaskContext.setTaskContext(context) + task + } finally { + TaskContext.unset() + } + } + } diff --git a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaMicroBatchSourceSuite.scala b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaMicroBatchSourceSuite.scala index 8663a5d8d26c..ae8a6886b2b4 100644 --- a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaMicroBatchSourceSuite.scala +++ b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaMicroBatchSourceSuite.scala @@ -1146,7 +1146,6 @@ class KafkaMicroBatchV2SourceSuite extends KafkaMicroBatchSourceSuiteBase { KafkaSourceOffset(Map(tp -> 100L))).map(_.asInstanceOf[KafkaBatchInputPartition]) withClue(s"minPartitions = $minPartitions generated factories $inputPartitions\n\t") { assert(inputPartitions.size == numPartitionsGenerated) - inputPartitions.foreach { f => assert(f.reuseKafkaConsumer == reusesConsumers) } } } } diff --git a/pom.xml b/pom.xml index 6a8424cc1328..17947451ea38 100644 --- a/pom.xml +++ b/pom.xml @@ -180,6 +180,8 @@ 2.6 3.8.1 + + 2.6.2 3.2.10 3.0.15 2.29 From 8cb52e39092e74a1db35ee909c5f93ccda9d1e55 Mon Sep 17 00:00:00 2001 From: "Jungtaek Lim (HeartSaVioR)" Date: Tue, 27 Aug 2019 06:23:49 +0900 Subject: [PATCH 02/13] Address review comments --- .../spark/sql/kafka010/FetchedDataPool.scala | 64 ++++++++----------- .../kafka010/InternalKafkaConsumerPool.scala | 25 ++++---- .../sql/kafka010/KafkaDataConsumer.scala | 6 +- .../sql/kafka010/FetchedDataPoolSuite.scala | 10 +-- .../InternalKafkaConsumerPoolSuite.scala | 30 ++++----- .../sql/kafka010/KafkaDataConsumerSuite.scala | 12 ++-- 6 files changed, 70 insertions(+), 77 deletions(-) diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/FetchedDataPool.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/FetchedDataPool.scala index a408c27d21f8..d58dfc222525 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/FetchedDataPool.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/FetchedDataPool.scala @@ -22,14 +22,13 @@ import java.util.concurrent.{ScheduledFuture, TimeUnit} import java.util.concurrent.atomic.LongAdder import scala.collection.mutable -import scala.util.control.NonFatal import org.apache.kafka.clients.consumer.ConsumerRecord import 
org.apache.spark.SparkEnv import org.apache.spark.internal.Logging import org.apache.spark.sql.kafka010.KafkaDataConsumer.{CacheKey, UNKNOWN_OFFSET} -import org.apache.spark.util.ThreadUtils +import org.apache.spark.util.{ThreadUtils, Utils} /** * Provides object pool for [[FetchedData]] which is grouped by [[CacheKey]]. @@ -46,12 +45,8 @@ private[kafka010] class FetchedDataPool extends Logging { private val (minEvictableIdleTimeMillis, evictorThreadRunIntervalMillis): (Long, Long) = { val conf = SparkEnv.get.conf - val minEvictIdleTime = conf.getLong(CONFIG_NAME_MIN_EVICTABLE_IDLE_TIME_MILLIS, - DEFAULT_VALUE_MIN_EVICTABLE_IDLE_TIME_MILLIS) - - val evictorThreadInterval = conf.getLong( - CONFIG_NAME_EVICTOR_THREAD_RUN_INTERVAL_MILLIS, - DEFAULT_VALUE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS) + val minEvictIdleTime = conf.get(CONSUMER_CACHE_MIN_EVICTABLE_IDLE_TIME_MILLIS) + val evictorThreadInterval = conf.get(CONSUMER_CACHE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS) (minEvictIdleTime, evictorThreadInterval) } @@ -62,12 +57,7 @@ private[kafka010] class FetchedDataPool extends Logging { private def startEvictorThread(): ScheduledFuture[_] = { executorService.scheduleAtFixedRate(new Runnable { override def run(): Unit = { - try { - removeIdleFetchedData() - } catch { - case NonFatal(e) => - logWarning("Exception occurred while removing idle fetched data.", e) - } + Utils.tryLogNonFatalError(removeIdleFetchedData()) } }, 0, evictorThreadRunIntervalMillis, TimeUnit.MILLISECONDS) } @@ -77,8 +67,8 @@ private[kafka010] class FetchedDataPool extends Logging { private val numCreatedFetchedData = new LongAdder() private val numTotalElements = new LongAdder() - def getNumCreated: Long = numCreatedFetchedData.sum() - def getNumTotal: Long = numTotalElements.sum() + def numCreated: Long = numCreatedFetchedData.sum() + def numTotal: Long = numTotalElements.sum() def acquire(key: CacheKey, desiredStartOffset: Long): FetchedData = synchronized { val fetchedDataList = cache.getOrElseUpdate(key, new CachedFetchedDataList()) @@ -112,25 +102,32 @@ private[kafka010] class FetchedDataPool extends Logging { } def release(key: CacheKey, fetchedData: FetchedData): Unit = synchronized { + def warnReleasedDataNotInPool(key: CacheKey, fetchedData: FetchedData): Unit = { + logWarning(s"No matching data in pool for $fetchedData in key $key. " + + "It might be released before, or it was not a part of pool.") + } + cache.get(key) match { case Some(fetchedDataList) => val cachedFetchedDataOption = fetchedDataList.find { p => p.inUse && p.getObject == fetchedData } - if (cachedFetchedDataOption.isDefined) { + if (cachedFetchedDataOption.isEmpty) { + warnReleasedDataNotInPool(key, fetchedData) + } else { val cachedFetchedData = cachedFetchedDataOption.get cachedFetchedData.inUse = false - cachedFetchedData.lastReleasedTimestamp = System.currentTimeMillis() + cachedFetchedData.lastReleasedTimestamp = System.nanoTime() } - case None => logWarning(s"No matching data in pool for $fetchedData in key $key. 
" + - "It might be released before, or it was not a part of pool.") + case None => + warnReleasedDataNotInPool(key, fetchedData) } } def shutdown(): Unit = { - executorService.shutdownNow() + ThreadUtils.shutdown(executorService) } def reset(): Unit = synchronized { @@ -144,13 +141,17 @@ private[kafka010] class FetchedDataPool extends Logging { } private def removeIdleFetchedData(): Unit = synchronized { - val timestamp = System.currentTimeMillis() - val maxAllowedIdleTimestamp = timestamp - minEvictableIdleTimeMillis + val timestamp = System.nanoTime() + val minEvictableIdleTimeNanos = TimeUnit.MILLISECONDS.toNanos(minEvictableIdleTimeMillis) + val maxAllowedIdleTimestamp = timestamp - minEvictableIdleTimeNanos cache.values.foreach { p: CachedFetchedDataList => - val idles = p.filter(q => !q.inUse && q.lastReleasedTimestamp < maxAllowedIdleTimestamp) - val lstSize = p.size - idles.foreach(idle => p -= idle) - numTotalElements.add(-1 * (lstSize - p.size)) + val expired = p.filter { + q => !q.inUse && q.lastReleasedTimestamp < maxAllowedIdleTimestamp + } + expired.foreach { + idle => p -= idle + } + numTotalElements.add(-1 * expired.size) } } } @@ -177,14 +178,5 @@ private[kafka010] object FetchedDataPool { private[kafka010] type CachedFetchedDataList = mutable.ListBuffer[CachedFetchedData] - val CONFIG_NAME_PREFIX = "spark.sql.kafkaFetchedDataCache." - val CONFIG_NAME_MIN_EVICTABLE_IDLE_TIME_MILLIS = CONFIG_NAME_PREFIX + - "minEvictableIdleTimeMillis" - val CONFIG_NAME_EVICTOR_THREAD_RUN_INTERVAL_MILLIS = CONFIG_NAME_PREFIX + - "evictorThreadRunIntervalMillis" - - val DEFAULT_VALUE_MIN_EVICTABLE_IDLE_TIME_MILLIS = 10 * 60 * 1000 // 10 minutes - val DEFAULT_VALUE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS = 5 * 60 * 1000 // 3 minutes - def build: FetchedDataPool = new FetchedDataPool() } diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPool.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPool.scala index f268508a7c61..fea4831333b7 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPool.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPool.scala @@ -52,7 +52,7 @@ private[kafka010] class InternalKafkaConsumerPool( // the class is intended to have only soft capacity assert(poolConfig.getMaxTotal < 0) - private lazy val pool = { + private val pool = { val internalPool = new GenericKeyedObjectPool[CacheKey, InternalKafkaConsumer]( objectFactory, poolConfig) internalPool.setSwallowedExceptionListener(CustomSwallowedExceptionListener) @@ -72,7 +72,7 @@ private[kafka010] class InternalKafkaConsumerPool( def borrowObject(key: CacheKey, kafkaParams: ju.Map[String, Object]): InternalKafkaConsumer = { updateKafkaParamForKey(key, kafkaParams) - if (getTotal == poolConfig.getSoftMaxTotal()) { + if (size == poolConfig.softMaxSize()) { pool.clearOldest() } @@ -111,17 +111,17 @@ private[kafka010] class InternalKafkaConsumerPool( pool.clear() } - def getNumIdle: Int = pool.getNumIdle + def numIdle: Int = pool.getNumIdle - def getNumIdle(key: CacheKey): Int = pool.getNumIdle(key) + def numIdle(key: CacheKey): Int = pool.getNumIdle(key) - def getNumActive: Int = pool.getNumActive + def numActive: Int = pool.getNumActive - def getNumActive(key: CacheKey): Int = pool.getNumActive(key) + def numActive(key: CacheKey): Int = pool.getNumActive(key) - def getTotal: Int = getNumIdle + getNumActive + def size: Int = 
numIdle + numActive - def getTotal(key: CacheKey): Int = getNumIdle(key) + getNumActive(key) + def size(key: CacheKey): Int = numIdle(key) + numActive(key) private def updateKafkaParamForKey(key: CacheKey, kafkaParams: ju.Map[String, Object]): Unit = { // We can assume that kafkaParam should not be different for same cache key, @@ -155,16 +155,16 @@ private[kafka010] object InternalKafkaConsumerPool { } class PoolConfig extends GenericKeyedObjectPoolConfig[InternalKafkaConsumer] { - private var softMaxTotal = Int.MaxValue + private var _softMaxSize = Int.MaxValue - def getSoftMaxTotal(): Int = softMaxTotal + def softMaxSize(): Int = _softMaxSize init() def init(): Unit = { val conf = SparkEnv.get.conf - softMaxTotal = conf.get(CONSUMER_CACHE_CAPACITY) + _softMaxSize = conf.get(CONSUMER_CACHE_CAPACITY) val jmxEnabled = conf.get(CONSUMER_CACHE_JMX_ENABLED) val minEvictableIdleTimeMillis = conf.get(CONSUMER_CACHE_MIN_EVICTABLE_IDLE_TIME_MILLIS) @@ -203,8 +203,7 @@ private[kafka010] object InternalKafkaConsumerPool { class ObjectFactory extends BaseKeyedPooledObjectFactory[CacheKey, InternalKafkaConsumer] with Logging { - val keyToKafkaParams: ConcurrentHashMap[CacheKey, ju.Map[String, Object]] = - new ConcurrentHashMap[CacheKey, ju.Map[String, Object]]() + val keyToKafkaParams = new ConcurrentHashMap[CacheKey, ju.Map[String, Object]]() override def create(key: CacheKey): InternalKafkaConsumer = { Option(keyToKafkaParams.get(key)) match { diff --git a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaDataConsumer.scala b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaDataConsumer.scala index 9e98ae562937..0cba9f7e59eb 100644 --- a/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaDataConsumer.scala +++ b/external/kafka-0-10-sql/src/main/scala/org/apache/spark/sql/kafka010/KafkaDataConsumer.scala @@ -46,7 +46,7 @@ private[kafka010] class InternalKafkaConsumer( val groupId = kafkaParams.get(ConsumerConfig.GROUP_ID_CONFIG).asInstanceOf[String] - private val consumer = createConsumer + private val consumer = createConsumer() /** * Poll messages from Kafka starting from `offset` and returns a pair of "list of consumer record" @@ -59,7 +59,7 @@ private[kafka010] class InternalKafkaConsumer( * consumer polls nothing before timeout. */ def fetch(offset: Long, pollTimeoutMs: Long): - (ju.List[ConsumerRecord[Array[Byte], Array[Byte]]], Long) = { + (ju.List[ConsumerRecord[Array[Byte], Array[Byte]]], Long) = { // Seek to the offset because we may call seekToBeginning or seekToEnd before this. 
seek(offset) @@ -105,7 +105,7 @@ private[kafka010] class InternalKafkaConsumer( } /** Create a KafkaConsumer to fetch records for `topicPartition` */ - private def createConsumer: KafkaConsumer[Array[Byte], Array[Byte]] = { + private def createConsumer(): KafkaConsumer[Array[Byte], Array[Byte]] = { val updatedKafkaParams = KafkaConfigUpdater("executor", kafkaParams.asScala.toMap) .setAuthenticationConfigIfNeeded() .build() diff --git a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/FetchedDataPoolSuite.scala b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/FetchedDataPoolSuite.scala index ad3975d673f3..c80b0adb1378 100644 --- a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/FetchedDataPoolSuite.scala +++ b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/FetchedDataPoolSuite.scala @@ -203,15 +203,15 @@ class FetchedDataPoolSuite extends SharedSparkSession with PrivateMethodTester { } test("evict idle fetched data") { - import FetchedDataPool._ import org.scalatest.time.SpanSugar._ val minEvictableIdleTimeMillis = 1000 val evictorThreadRunIntervalMillis = 500 val newConf = Seq( - CONFIG_NAME_MIN_EVICTABLE_IDLE_TIME_MILLIS -> minEvictableIdleTimeMillis.toString, - CONFIG_NAME_EVICTOR_THREAD_RUN_INTERVAL_MILLIS -> evictorThreadRunIntervalMillis.toString) + CONSUMER_CACHE_MIN_EVICTABLE_IDLE_TIME_MILLIS.key -> minEvictableIdleTimeMillis.toString, + CONSUMER_CACHE_EVICTOR_THREAD_RUN_INTERVAL_MILLIS.key -> + evictorThreadRunIntervalMillis.toString) withSparkConf(newConf: _*) { val dataPool = FetchedDataPool.build @@ -331,7 +331,7 @@ class FetchedDataPoolSuite extends SharedSparkSession with PrivateMethodTester { fetchedDataPool: FetchedDataPool, expectedNumCreated: Long, expectedNumTotal: Long): Unit = { - assert(fetchedDataPool.getNumCreated === expectedNumCreated) - assert(fetchedDataPool.getNumTotal === expectedNumTotal) + assert(fetchedDataPool.numCreated === expectedNumCreated) + assert(fetchedDataPool.numTotal === expectedNumTotal) } } diff --git a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPoolSuite.scala b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPoolSuite.scala index 7aa13b7042e3..497c784c238e 100644 --- a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPoolSuite.scala +++ b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/InternalKafkaConsumerPoolSuite.scala @@ -125,11 +125,11 @@ class InternalKafkaConsumerPoolSuite extends SharedSparkSession { assertPoolStateForKey(pool, newCacheKey, numIdle = 0, numActive = 1, numTotal = 1) // at least one of idle object should be freed up - assert(pool.getNumIdle < numToReturn) + assert(pool.numIdle < numToReturn) // we can determine number of active objects correctly - assert(pool.getNumActive === keyToPooledObjectPairs.length - numToReturn + 1) + assert(pool.numActive === keyToPooledObjectPairs.length - numToReturn + 1) // total objects should be more than number of active + 1 but can't expect exact number - assert(pool.getTotal > keyToPooledObjectPairs.length - numToReturn + 1) + assert(pool.size > keyToPooledObjectPairs.length - numToReturn + 1) } } @@ -231,9 +231,9 @@ class InternalKafkaConsumerPoolSuite extends SharedSparkSession { numIdle: Int, numActive: Int, numTotal: Int): Unit = { - assert(pool.getNumIdle === numIdle) - assert(pool.getNumActive === numActive) - assert(pool.getTotal === numTotal) + 
assert(pool.numIdle === numIdle) + assert(pool.numActive === numActive) + assert(pool.size === numTotal) } private def assertPoolStateForKey( @@ -242,9 +242,9 @@ class InternalKafkaConsumerPoolSuite extends SharedSparkSession { numIdle: Int, numActive: Int, numTotal: Int): Unit = { - assert(pool.getNumIdle(key) === numIdle) - assert(pool.getNumActive(key) === numActive) - assert(pool.getTotal(key) === numTotal) + assert(pool.numIdle(key) === numIdle) + assert(pool.numActive(key) === numActive) + assert(pool.size(key) === numTotal) } private def getTestKafkaParams: ju.Map[String, Object] = Map[String, Object]( @@ -261,9 +261,9 @@ class InternalKafkaConsumerPoolSuite extends SharedSparkSession { kafkaParams: ju.Map[String, Object], keys: List[CacheKey]): Seq[(CacheKey, InternalKafkaConsumer)] = { keys.map { key => - val numActiveBeforeBorrowing = pool.getNumActive - val numIdleBeforeBorrowing = pool.getNumIdle - val numTotalBeforeBorrowing = pool.getTotal + val numActiveBeforeBorrowing = pool.numActive + val numIdleBeforeBorrowing = pool.numIdle + val numTotalBeforeBorrowing = pool.size val pooledObj = pool.borrowObject(key, kafkaParams) @@ -279,9 +279,9 @@ class InternalKafkaConsumerPoolSuite extends SharedSparkSession { pool: InternalKafkaConsumerPool, objects: Seq[(CacheKey, InternalKafkaConsumer)]): Unit = { objects.foreach { case (key, pooledObj) => - val numActiveBeforeReturning = pool.getNumActive - val numIdleBeforeReturning = pool.getNumIdle - val numTotalBeforeReturning = pool.getTotal + val numActiveBeforeReturning = pool.numActive + val numIdleBeforeReturning = pool.numIdle + val numTotalBeforeReturning = pool.size pool.returnObject(pooledObj) diff --git a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaDataConsumerSuite.scala b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaDataConsumerSuite.scala index 3c89f5f7efd6..80f9a1b410d2 100644 --- a/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaDataConsumerSuite.scala +++ b/external/kafka-0-10-sql/src/test/scala/org/apache/spark/sql/kafka010/KafkaDataConsumerSuite.scala @@ -105,7 +105,8 @@ class KafkaDataConsumerSuite extends SharedSparkSession with PrivateMethodTester consumer1.release() - assert(consumerPool.getTotal(key) === 1) + assert(consumerPool.size(key) === 1) + // check whether acquired object is available in pool val pooledObj = consumerPool.borrowObject(key, kafkaParams) assert(consumer1Underlying.get.eq(pooledObj)) consumerPool.returnObject(pooledObj) @@ -124,8 +125,9 @@ class KafkaDataConsumerSuite extends SharedSparkSession with PrivateMethodTester consumer2.release() - // The first consumer should be removed from cache, but second consumer should be cached. - assert(consumerPool.getTotal(key) === 1) + // The first consumer should be removed from cache, but the consumer after invalidate + // should be cached. 
+ assert(consumerPool.size(key) === 1) val pooledObj2 = consumerPool.borrowObject(key, kafkaParams) assert(consumer2Underlying.get.eq(pooledObj2)) consumerPool.returnObject(pooledObj2) @@ -286,8 +288,8 @@ class KafkaDataConsumerSuite extends SharedSparkSession with PrivateMethodTester fetchedDataPool: FetchedDataPool, expectedNumCreated: Long, expectedNumTotal: Long): Unit = { - assert(fetchedDataPool.getNumCreated === expectedNumCreated) - assert(fetchedDataPool.getNumTotal === expectedNumTotal) + assert(fetchedDataPool.numCreated === expectedNumCreated) + assert(fetchedDataPool.numTotal === expectedNumTotal) } private def readAndGetLastOffset( From 9543745bc41b2adf258a8a91e3c5aab59c5d0cbd Mon Sep 17 00:00:00 2001 From: "Jungtaek Lim (HeartSaVioR)" Date: Tue, 27 Aug 2019 14:19:18 +0900 Subject: [PATCH 03/13] Modify eviction UT to leverage manual scheduler and clock --- external/kafka-0-10-sql/pom.xml | 5 ++ .../spark/sql/kafka010/FetchedDataPool.scala | 36 ++++++----- .../sql/kafka010/FetchedDataPoolSuite.scala | 60 ++++++++++++++----- 3 files changed, 72 insertions(+), 29 deletions(-) diff --git a/external/kafka-0-10-sql/pom.xml b/external/kafka-0-10-sql/pom.xml index feba787e9901..5b8738263a60 100644 --- a/external/kafka-0-10-sql/pom.xml +++ b/external/kafka-0-10-sql/pom.xml @@ -130,6 +130,11 @@ org.apache.spark spark-tags_${scala.binary.version} + + org.jmock + jmock-junit4 + test +
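For readers skimming this series, here is a minimal sketch of the executor-side usage pattern after these patches: acquire no longer takes a useCache flag, reuse is decided entirely by the consumer and fetched-data pools, and release() hands both the consumer and its fetched data back to the pools. The group id, bootstrap servers, topic name, and the small read loop below are illustrative values only, not taken from the patch.

    import java.{util => ju}

    import scala.collection.JavaConverters._

    import org.apache.kafka.clients.consumer.ConsumerConfig._
    import org.apache.kafka.common.TopicPartition
    import org.apache.kafka.common.serialization.ByteArrayDeserializer

    // Illustrative executor-side Kafka params; a real query generates its own group id.
    val kafkaParams: ju.Map[String, Object] = Map[String, Object](
      GROUP_ID_CONFIG -> "example-group",
      BOOTSTRAP_SERVERS_CONFIG -> "localhost:9092",
      KEY_DESERIALIZER_CLASS_CONFIG -> classOf[ByteArrayDeserializer].getName,
      VALUE_DESERIALIZER_CLASS_CONFIG -> classOf[ByteArrayDeserializer].getName).asJava

    // Borrow a pooled consumer for the partition; the pool creates one if none is cached.
    val consumer = KafkaDataConsumer.acquire(new TopicPartition("topic", 0), kafkaParams)
    try {
      val range = consumer.getAvailableOffsetRange()
      var offset = range.earliest
      // Read a handful of records; get() reuses cached fetched data when offsets line up.
      (0 until 5).foreach { _ =>
        val record = consumer.get(offset, range.latest, 10000, failOnDataLoss = false)
        offset = record.offset() + 1
      }
    } finally {
      consumer.release() // returns the consumer and its fetched data to the pools
    }

The jmock-junit4 test dependency added just above presumably provides org.jmock.lib.concurrent.DeterministicScheduler, so the reworked eviction test can drive the evictor thread and clock manually instead of relying on real sleeps.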