apache · southernriver · Jul 15, 2020 · Dec 8, 2020 · Dec 9, 2020 · sunchao
diff --git a/build/._scala-2.12.10 b/build/._scala-2.12.10
diff --git a/build/._zinc-0.3.15 b/build/._zinc-0.3.15
diff --git a/sql/hive/src/main/scala/org/apache/spark/sql/hive/HiveSessionCatalog.scala b/sql/hive/src/main/scala/org/apache/spark/sql/hive/HiveSessionCatalog.scala
@@ -91,8 +91,23 @@ private[sql] class HiveSessionCatalog(
               isUDAFBridgeRequired = true))
             udfExpr.get.dataType // Force it to check input data types.
           } else if (classOf[GenericUDTF].isAssignableFrom(clazz)) {
-            udfExpr = Some(HiveGenericUDTF(name, new HiveFunctionWrapper(clazz.getName), input))
-            udfExpr.get.asInstanceOf[HiveGenericUDTF].elementSchema // Force it to check data types.
+            // Builds the UDTF for the chosen `initialize` overload and forces `elementSchema`,
+            // so that initialization failures are raised here.
+            def resolveUDTF(deprecated: Boolean): Unit = {
+              val udtf = HiveGenericUDTF(
+                name, new HiveFunctionWrapper(clazz.getName), input, deprecated)
+              udfExpr = Some(udtf)
+              udtf.elementSchema // Force it to check data types.
+            }
+            try {
+              resolveUDTF(deprecated = true)
+            } catch {
+              // Retry with initialize(StructObjectInspector) on non-fatal failures only.
+              case NonFatal(_) =>
+                logInfo("HiveGenericUDTF initialize(ObjectInspector[] args) is deprecated, and" +
+                  " we will suit the latest version of initialize(StructObjectInspector argOIs).")
+                resolveUDTF(deprecated = false)
+            }
           }
         } catch {
           case NonFatal(e) =>

diff --git a/sql/hive/src/main/scala/org/apache/spark/sql/hive/hiveUDFs.scala b/sql/hive/src/main/scala/org/apache/spark/sql/hive/hiveUDFs.scala
@@ -198,7 +198,8 @@ private[hive] case class HiveGenericUDF(
 private[hive] case class HiveGenericUDTF(
     name: String,
     funcWrapper: HiveFunctionWrapper,
-    children: Seq[Expression])
+    children: Seq[Expression],
+    deprecated: Boolean = true)
   extends Generator with HiveInspectors with CodegenFallback with UserDefinedExpression {
 
   @transient
@@ -212,7 +213,24 @@ private[hive] case class HiveGenericUDTF(
   protected lazy val inputInspectors = children.map(toInspector)
 
   @transient
-  protected lazy val outputInspector = function.initialize(inputInspectors.toArray)
+  // One distinct positional name per input column (_col0, _col1, ...), so that struct fields
+  // can be told apart when looked up by name.
+  protected lazy val inputColNames = children.indices.map(i => s"_col$i").asJava
+
+  // Struct inspector wrapping all input columns, for initialize(StructObjectInspector).
+  @transient
+  protected lazy val rowOI = ObjectInspectorFactory.getStandardStructObjectInspector(
+    inputColNames, inputInspectors.asJava)
+
+  // Result of the `initialize` overload selected by `deprecated`.
+  @transient
+  protected lazy val outputInspector =
+    if (deprecated) {
+      // Legacy overload: initialize(ObjectInspector[] args).
+      function.initialize(inputInspectors.toArray)
+    } else {
+      function.initialize(rowOI)
+    }
 
   @transient
   protected lazy val udtInput = new Array[AnyRef](children.length)

diff --git a/sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/SQLQuerySuite.scala b/sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/SQLQuerySuite.scala
@@ -2132,11 +2132,9 @@ class SQLQuerySuite extends QueryTest with SQLTestUtils with TestHiveSingleton {
            |AS 'org.apache.spark.sql.hive.execution.UDTFStack2'
            |USING JAR '${hiveContext.getHiveFile("SPARK-21101-1.0.jar").toURI}'
         """.stripMargin)
-      val e = intercept[org.apache.spark.sql.AnalysisException] {
-        sql("SELECT udtf_stack2(2, 'A', 10, date '2015-01-01', 'B', 20, date '2016-01-01')")
-      }
-      assert(
-        e.getMessage.contains("public StructObjectInspector initialize(ObjectInspector[] args)"))
+      val num =
+        sql("SELECT udtf_stack2(2, 'A', 10, date '2015-01-01', 'B', 20, date '2016-01-01')").count()
+      assert(num === 2)
     }
   }