Deprecate Spark 2.x #2305

Merged (6 commits, Jan 3, 2025)

11 changes: 11 additions & 0 deletions docs/src/reference/asciidoc/appendix/breaking.adoc
@@ -8,6 +8,17 @@ For clarity, we always list any breaking changes at the top of the
//NOTE: The notable-breaking-changes tagged regions are re-used in the
//Installation and Upgrade Guide

=== Deprecations in 8.18

The following functionality has been deprecated in {eh} 8.18 and will be removed
in a future version. While this won’t have an immediate impact on your
applications, we strongly encourage you to take the described steps to update your
code after upgrading to 8.18.

==== Spark 2.x support is deprecated

Spark 2.x is no longer maintained upstream, so its support in {eh} is deprecated. Spark 3 continues to be supported.

[[breaking-changes-8.9]]
=== Breaking Changes in 8.9

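To act on that advice, the main step for most builds is swapping the Spark 2.x connector artifact for the Spark 3.x one. A minimal sbt sketch, assuming the usual elasticsearch-hadoop artifact naming; the version number is a placeholder:

// build.sbt: move from the Spark 2.x connector to the Spark 3.x one.
// Before (Spark 2.x, now deprecated):
//   libraryDependencies += "org.elasticsearch" %% "elasticsearch-spark-20" % "8.18.0"
// After (Spark 3.x):
libraryDependencies += "org.elasticsearch" %% "elasticsearch-spark-30" % "8.18.0"
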
2 changes: 2 additions & 0 deletions docs/src/reference/asciidoc/core/intro/requirements.adoc
@@ -81,6 +81,8 @@ Hive version {hv-v}
[[requirements-spark]]
=== Apache Spark

deprecated::[9.0,Support for Spark 2.x in {eh} is deprecated.]

Spark 2.0 or higher. We recommend using the latest release of Spark (currently {sp-v}). As {eh} provides native integration (which is recommended) with {sp}, it does not matter what binary one is using.
The same applies when using the Hadoop layer to integrate the two as {eh} supports the majority of
Hadoop distributions out there.
@@ -854,10 +854,10 @@ class AbstractScalaEsScalaSpark(prefix: String, readMetadata: jl.Boolean) extend
val target = resource(index, typename, version)

    val rawCore = List( Map("colint" -> 1, "colstr" -> "s"),
-                        Map("colint" -> null, "colstr" -> null) )
+                        Map("colint" -> 9, "colstr" -> null) )
sc.parallelize(rawCore, 1).saveToEs(target)
    val qjson =
-      """{"query":{"range":{"colint":{"from":null,"to":"9","include_lower":true,"include_upper":true}}}}"""
+      """{"query":{"range":{"colint":{"lte":"9"}}}}"""
Member:
I assume this was some change in range query syntax in Elasticsearch, not related to deprecation?

Contributor Author:
Exactly, this is to fix the broken test.

val esRDD = EsSpark.esRDD(sc, target, qjson)
val scRDD = sc.esRDD(target, qjson)
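As the exchange above notes, the updated query string tracks a change in the Elasticsearch query DSL: the legacy from/to/include_lower/include_upper range parameters are no longer accepted by recent Elasticsearch versions, which use gt/gte/lt/lte instead. A side-by-side sketch (variable names are illustrative):

// Legacy range syntax, rejected by current Elasticsearch versions:
val legacyQuery = """{"query":{"range":{"colint":{"from":null,"to":"9","include_lower":true,"include_upper":true}}}}"""
// Current equivalent of "colint <= 9", expressed with lte:
val currentQuery = """{"query":{"range":{"colint":{"lte":"9"}}}}"""
// Used with the test's SparkContext and target, e.g.:
//   val esRDD = EsSpark.esRDD(sc, target, currentQuery)
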
@@ -37,6 +37,7 @@ import scala.collection.JavaConverters.mapAsJavaMapConverter
import scala.collection.JavaConverters.propertiesAsScalaMapConverter
import scala.collection.Map

@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
object EsSparkSQL {

private val init = { ObjectUtils.loadClass("org.elasticsearch.spark.rdd.CompatUtils", classOf[ObjectUtils].getClassLoader) }
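For callers, the effect of this annotation is a compile-time warning rather than a behavior change. A minimal sketch, assuming the connector is on the classpath; the index name is a placeholder and the warning text is approximate:

import org.apache.spark.sql.DataFrame
import org.elasticsearch.spark.sql.EsSparkSQL

def writeUsers(df: DataFrame): Unit = {
  // Still compiles and runs, but with -deprecation scalac reports something like:
  //   warning: object EsSparkSQL is deprecated: Support for Apache Spark 2 is deprecated. Use Spark 3.
  EsSparkSQL.saveToEs(df, "users")
}

Projects that compile with -Xfatal-warnings will need to migrate or suppress the warning before upgrading.
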
@@ -31,6 +31,7 @@ import org.elasticsearch.hadoop.cfg.ConfigurationOptions.ES_QUERY
import org.elasticsearch.hadoop.cfg.ConfigurationOptions.ES_RESOURCE_READ
import org.elasticsearch.spark.sql.EsSparkSQL

@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
object JavaEsSparkSQL {

// specify the return types to make sure the bytecode is generated properly (w/o any scala.collections in it)
@@ -29,8 +29,10 @@ import scala.reflect.ClassTag

package object sql {

@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
implicit def sqlContextFunctions(sc: SQLContext)= new SQLContextFunctions(sc)

@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
class SQLContextFunctions(sc: SQLContext) extends Serializable {
def esDF() = EsSparkSQL.esDF(sc)
def esDF(resource: String) = EsSparkSQL.esDF(sc, resource)
@@ -42,16 +44,20 @@ package object sql {

// the sparkDatasetFunctions already takes care of this
// but older clients might still import it hence why it's still here
@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
implicit def sparkDataFrameFunctions(df: DataFrame) = new SparkDataFrameFunctions(df)

@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
class SparkDataFrameFunctions(df: DataFrame) extends Serializable {
def saveToEs(resource: String): Unit = { EsSparkSQL.saveToEs(df, resource) }
def saveToEs(resource: String, cfg: scala.collection.Map[String, String]): Unit = { EsSparkSQL.saveToEs(df, resource, cfg) }
def saveToEs(cfg: scala.collection.Map[String, String]): Unit = { EsSparkSQL.saveToEs(df, cfg) }
}


@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
implicit def sparkSessionFunctions(ss: SparkSession)= new SparkSessionFunctions(ss)


@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
class SparkSessionFunctions(ss: SparkSession) extends Serializable {
def esDF() = EsSparkSQL.esDF(ss)
def esDF(resource: String) = EsSparkSQL.esDF(ss, resource)
@@ -61,8 +67,10 @@ package object sql {
def esDF(resource: String, query: String, cfg: scala.collection.Map[String, String]) = EsSparkSQL.esDF(ss, resource, query, cfg)
}

@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
implicit def sparkDatasetFunctions[T : ClassTag](ds: Dataset[T]) = new SparkDatasetFunctions(ds)


@deprecated("Support for Apache Spark 2 is deprecated. Use Spark 3.")
class SparkDatasetFunctions[T : ClassTag](ds: Dataset[T]) extends Serializable {
def saveToEs(resource: String): Unit = { EsSparkSQL.saveToEs(ds, resource) }
def saveToEs(resource: String, cfg: scala.collection.Map[String, String]): Unit = { EsSparkSQL.saveToEs(ds, resource, cfg) }
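Since these implicits back the common import-and-call style, existing Spark 2.x applications pick up the deprecation warnings without any code change. A self-contained sketch; the app name, input path, and index are placeholders:

import org.apache.spark.sql.SparkSession
import org.elasticsearch.spark.sql._  // brings the implicit conversions above into scope

object EsDemo {
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder().appName("es-demo").getOrCreate()
    val df = spark.read.json("people.json")
    // Resolved through the deprecated implicit conversions above, so
    // compiling with -deprecation surfaces the Spark 2 deprecation message.
    df.saveToEs("people")
    spark.stop()
  }
}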