docs/sql-migration-guide.md (46 additions, 0 deletions)

@@ -256,6 +256,52 @@ license: |

- Since Spark 3.0, the unary arithmetic operator plus (`+`) only accepts string, numeric, and interval type values as inputs. Besides, `+` with an integral string representation is coerced to a double value, e.g. `+'1'` results in `1.0`. In Spark version 2.4 and earlier, this operator is ignored: there is no type checking for it, so all values with a `+` prefix are valid, e.g. `+ array(1, 2)` is valid and results in `[1, 2]`; and there is no type coercion for it at all, e.g. in Spark 2.4 the result of `+'1'` is the string `1`.

- Since Spark 3.0, the parameters (first or second) of the `array_contains` function are implicitly promoted to the wider of the two types.
Contributor:
@maropu @srowen do we still need a migration guide entry? It looks like an obvious bug to me that we forgot to do type coercion for decimal types, and I don't think a user would expect Spark to fail `array_contains` with compatible decimal types.

Member:

Ah, I see. The latest fix looks reasonable. This is not a behaviour change but a bug fix.

Contributor Author:

Thanks @cloud-fan @maropu. I will revert these changes from the migration guide.

<table class="table">
<tr>
<th>
<b>Query</b>
</th>
<th>
<b>Spark 2.4</b>
</th>
<th>
<b>Spark 3.0</b>
</th>
<th>
<b>Remarks</b>
</th>
</tr>
<tr>
<td>
<code>select array_contains(array(1.10), 1.1);</code>
</td>
<td>
<code>AnalysisException</code> is thrown.
</td>
<td>
<code>true</code>
</td>
<td>
In Spark 2.4, the left parameter is of type <code>array(decimal(3,2))</code> whereas the right parameter is of type <code>decimal(2,1)</code>.
</td>
</tr>
<tr>
<td>
<code>select array_contains(array(1.1), 1.10);</code>
</td>
<td>
<code>AnalysisException</code> is thrown.
</td>
<td>
<code>true</code>
</td>
<td>
In Spark 2.4, the left parameter is of type <code>array(decimal(2,1))</code> whereas the right parameter is of type <code>decimal(3,2)</code>.
</td>
</tr>
</table>

## Upgrading from Spark SQL 2.4 to 2.4.1

- The value of `spark.executor.heartbeatInterval`, when specified without units like "30" rather than "30s", was
@@ -243,7 +243,7 @@ object TypeCoercion {
* string. If the wider decimal type exceeds system limitation, this rule will truncate
* the decimal type before return it.
*/
-  private[analysis] def findWiderTypeWithoutStringPromotionForTwo(
+  private[catalyst] def findWiderTypeWithoutStringPromotionForTwo(
t1: DataType,
t2: DataType): Option[DataType] = {
findTightestCommonType(t1, t2)
@@ -1081,7 +1081,7 @@ case class ArrayContains(left: Expression, right: Expression)
(left.dataType, right.dataType) match {
case (_, NullType) => Seq.empty
case (ArrayType(e1, hasNull), e2) =>
-      TypeCoercion.findTightestCommonType(e1, e2) match {
+      TypeCoercion.findWiderTypeWithoutStringPromotionForTwo(e1, e2) match {
case Some(dt) => Seq(ArrayType(dt, hasNull), dt)
case _ => Seq.empty
}
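The one-line change above is the heart of the fix. Its effect can be sketched with a toy model (hypothetical stand-ins, not Spark's actual `TypeCoercion` code): the tightest-common-type lookup has no decimal-widening case, while the wider-type lookup widens to a decimal that can hold both operands.

```scala
// Toy model of the two lookups, restricted to decimal types written as
// (precision, scale). Spark's real rules handle many more types.
object CoercionSketch {
  type Dec = (Int, Int)

  // findTightestCommonType has no decimal-widening case: for two distinct
  // decimal types it finds nothing, so ArrayContains stays unresolved.
  def tightest(t1: Dec, t2: Dec): Option[Dec] =
    if (t1 == t2) Some(t1) else None

  // The wider-type lookup keeps the larger scale and enough integer
  // digits to hold both operands.
  def wider(t1: Dec, t2: Dec): Option[Dec] = {
    val scale = math.max(t1._2, t2._2)
    val intDigits = math.max(t1._1 - t1._2, t2._1 - t2._2)
    Some((intDigits + scale, scale))
  }
}

// array(1.10) has element type decimal(3,2); the literal 1.1 is decimal(2,1):
// tightest((3, 2), (2, 1)) is None        -> Spark 2.4 AnalysisException
// wider((3, 2), (2, 1)) is Some((3, 2))   -> Spark 3.0 resolves and returns true
```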
@@ -850,7 +850,7 @@ class DataFrameFunctionsSuite extends QueryTest with SharedSparkSession {
val errorMsg1 =
s"""
|Input to function array_contains should have been array followed by a
-        |value with same element type, but it's [array<int>, decimal(29,29)].
+        |value with same element type, but it's [array<int>, decimal(38,29)].
Contributor:
Why does the precision become 38 in this case?

Contributor Author:

case e: ImplicitCastInputTypes if e.inputTypes.nonEmpty =>
  val children: Seq[Expression] = e.children.zip(e.inputTypes).map { case (in, expected) =>
    // If we cannot do the implicit cast, just use the original input.
    implicitCast(in, expected).getOrElse(in)
  }
  e.withNewChildren(children)

For the query `array_contains(array(1), .01234567890123456790123456780)`, `e.inputTypes` returns `Seq(Array(Decimal(38,29)), Decimal(38,29))`, and the above code casts `.01234567890123456790123456780` to `Decimal(38,29)`.
Previously, when we were using findWiderTypeForTwo, decimal types were not upcast, but `findWiderTypeWithoutStringPromotionForTwo` successfully upcasts `DecimalType`.
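The 38 falls out of capping at Spark's maximum decimal precision: the literal has 29 fractional digits, i.e. decimal(29,29); the array element is int, i.e. decimal(10,0); the union needs 10 + 29 = 39 digits, which is capped at 38 while keeping scale 29. A rough sketch of that capping (an assumed simplification of Spark's bounded-decimal adjustment, not the real code):

```scala
object BoundedWiden {
  val MaxPrecision = 38 // Spark's system limit for decimal precision

  // Widen two (precision, scale) pairs, then cap precision at the limit.
  def boundedWider(t1: (Int, Int), t2: (Int, Int)): (Int, Int) = {
    val scale = math.max(t1._2, t2._2)
    val intDigits = math.max(t1._1 - t1._2, t2._1 - t2._2)
    (math.min(intDigits + scale, MaxPrecision), scale)
  }
}

// int is decimal(10,0); a 29-digit fraction literal is decimal(29,29):
// boundedWider((10, 0), (29, 29)) == (38, 29) -- hence decimal(38,29) in the message
```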

Contributor:

> Previously, when we were using findWiderTypeForTwo

Before this PR, we were using `findTightestCommonType`. Why do we add a cast but still can't resolve `ArrayContains`?

Contributor Author:

Do you mean: why, in the above test-case query, does `ArrayContains` throw `AnalysisException` instead of casting the integer to decimal?

An integer cannot be cast to a decimal with scale > 28.

decimalWith28Zeroes = 1.0000000000000000000000000000
SELECT array_contains(array(1), decimalWith28Zeroes);
Result => true
decimalWith29Zeroes = 1.00000000000000000000000000000
SELECT array_contains(array(1), decimalWith29Zeroes);
Result => AnalysisException
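The scale-28 boundary follows from the same arithmetic: an int needs 10 integer digits, so a lossless common decimal with scale s needs precision 10 + s, which fits within 38 only for s <= 28. A minimal check under that assumption (hypothetical helper name, not a Spark API):

```scala
object IntDecimalFit {
  val MaxPrecision = 38 // Spark's decimal precision limit
  val IntDigits = 10    // Int.MaxValue has 10 decimal digits

  // Can an int and a decimal of the given scale share a lossless common type?
  def fits(scale: Int): Boolean = IntDigits + scale <= MaxPrecision
}

// fits(28) -- true:  array_contains(array(1), 1.00...0 [28 zeroes]) resolves
// fits(29) -- false: AnalysisException
```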


Contributor (@cloud-fan, Dec 17, 2019):

Yeah, I get that we can't do the cast here. My question is: since we can't do the cast, we should leave the expression untouched. But now we add a cast to one side and leave the expression unresolved. Where do we add that useless cast?

Contributor Author:

case e: ImplicitCastInputTypes if e.inputTypes.nonEmpty =>
  val children: Seq[Expression] = e.children.zip(e.inputTypes).map { case (in, expected) =>
    // If we cannot do the implicit cast, just use the original input.
    implicitCast(in, expected).getOrElse(in)
  }
  e.withNewChildren(children)

This code casts the left and right expressions one by one. Here,

  • `e.children` is `Seq(array<int>, decimal(29,29))`, and
  • `e.inputTypes` returns `Seq(array<decimal(38,29)>, decimal(38,29))`.

`implicitCast(array<int>, array<decimal(38,29)>)` returns `None`, since `int` can't be cast to `decimal(38,29)`.
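The per-child fallback can be modelled in isolation: each child is cast independently, and a failed cast silently keeps the original child, so one side ends up cast while the other stays as-is and the expression remains unresolved (a toy model with made-up type strings, not Spark's `ImplicitCastInputTypes`):

```scala
// Toy model: expressions carry a type string; only decimal-to-decimal
// casts succeed, everything else falls back to the original child.
object PerChildCast {
  final case class Expr(tpe: String)

  def implicitCast(in: Expr, expected: String): Option[Expr] =
    if (in.tpe.startsWith("decimal") && expected.startsWith("decimal"))
      Some(Expr(expected))
    else None

  def castChildren(children: Seq[Expr], expected: Seq[String]): Seq[Expr] =
    children.zip(expected).map { case (in, exp) =>
      // If we cannot do the implicit cast, just use the original input.
      implicitCast(in, exp).getOrElse(in)
    }
}

// Only the right child is cast; the left keeps array<int>, so the
// "array followed by a value with the same element type" check still fails:
// castChildren(Seq(Expr("array<int>"), Expr("decimal(29,29)")),
//              Seq("array<decimal(38,29)>", "decimal(38,29)"))
// == Seq(Expr("array<int>"), Expr("decimal(38,29)"))
```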

Contributor Author:

So the above code creates a new expression by updating only the right child.

Contributor:

Ah, thanks for finding this out!

""".stripMargin.replace("\n", " ").trim()
assert(e1.message.contains(errorMsg1))

@@ -863,6 +863,21 @@ class DataFrameFunctionsSuite extends QueryTest with SharedSparkSession {
|value with same element type, but it's [array<int>, string].
""".stripMargin.replace("\n", " ").trim()
assert(e2.message.contains(errorMsg2))

Member:

Since this is a bug, can you split these three tests into a separate test unit and add a test title with the JIRA ID (SPARK-29600)?

Member:

Also, can you update the title, too?

Contributor Author:

Sure, I'll update.

checkAnswer(
sql("select array_contains(array(1.10), 1.1)"),
Seq(Row(true))
)

checkAnswer(
sql("SELECT array_contains(array(1.1), 1.10)"),
Seq(Row(true))
)

checkAnswer(
sql("SELECT array_contains(array(1.11), 1.1)"),
Seq(Row(false))
)
}

test("arrays_overlap function") {