Add a comment explaining why df_for_struct is set for scalar Pandas UDFs (SPARK-27240).

apache · ueshin · Mar 22, 2019 · Mar 22, 2019 · Mar 25, 2019 · Mar 22, 2019
commit f8b34041fe16f64aac2baaf14e32925635984ff8
diff --git a/python/pyspark/worker.py b/python/pyspark/worker.py
@@ -253,6 +253,8 @@ def read_udfs(pickleSer, infile, eval_type):
             "spark.sql.legacy.execution.pandas.groupedMap.assignColumnsByName", "true")\
             .lower() == "true"
 
+        # Scalar Pandas UDF handles struct type arguments as pandas DataFrames instead of
+        # pandas Series. See SPARK-27240.
         df_for_struct = eval_type == PythonEvalType.SQL_SCALAR_PANDAS_UDF
         ser = ArrowStreamPandasUDFSerializer(timezone, safecheck, assign_cols_by_name,
                                              df_for_struct)