From c10b57786a5fad615036a14d0eb22e258f34ad11 Mon Sep 17 00:00:00 2001
From: Shixiong Zhu <zsxwing@gmail.com>
Date: Fri, 10 Dec 2021 00:20:49 -0800
Subject: [PATCH 1/3] Optimize lit by calling Literal.apply instead of ScalaReflection

---
 .../scala/org/apache/spark/sql/functions.scala    | 15 ++++++++++++++-
 .../apache/spark/sql/ColumnExpressionSuite.scala  | 12 ++++++++++++
 2 files changed, 26 insertions(+), 1 deletion(-)

diff --git a/sql/core/src/main/scala/org/apache/spark/sql/functions.scala b/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
index 8192350baa06..cda9e895b106 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
@@ -113,7 +113,17 @@ object functions {
    * @group normal_funcs
    * @since 1.3.0
    */
-  def lit(literal: Any): Column = typedLit(literal)
+  def lit(literal: Any): Column = literal match {
+    case c: Column => c
+    case s: Symbol => new ColumnName(s.name)
+    case _ =>
+      // This is different from `typedLit`. `typedLit` calls `Literal.create` to use
+      // `ScalaReflection` to get the type of `literal`. However, since we use `Any` in this method,
+      // `typedLit[Any](literal)` will always fail and fallback to `Literal.apply`. Hence, we can
+      // just manually call `Literal.apply` to skip the expensive `ScalaReflection` code. This is
+      // significantly better when there are many threads calling `lit` concurrently.
+      Column(Literal(literal))
+  }
 
   /**
    * Creates a [[Column]] of literal value.
@@ -134,6 +144,9 @@ object functions {
    * The difference between this function and [[lit]] is that this function
    * can handle parameterized scala types e.g.: List, Seq and Map.
    *
+   * Note: `typedLit` will call expensive Scala reflection APIs. `lit` is preferred if parameterized
+   * scala types are not used.
+   *
    * @group normal_funcs
    * @since 3.2.0
    */
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/ColumnExpressionSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/ColumnExpressionSuite.scala
index 2acc4ff68796..fe56bcb99117 100644
--- a/sql/core/src/test/scala/org/apache/spark/sql/ColumnExpressionSuite.scala
+++ b/sql/core/src/test/scala/org/apache/spark/sql/ColumnExpressionSuite.scala
@@ -932,7 +932,19 @@ class ColumnExpressionSuite extends QueryTest with SharedSparkSession {
       testData2.collect().toSeq.map(r => Row(r.getInt(0) ^ r.getInt(1) ^ 39)))
   }
 
+  test("SPARK-37646: lit") {
+    assert(lit($"foo") == $"foo")
+    assert(lit('foo) == $"foo")
+    assert(lit(1) == Column(Literal(1)))
+    assert(lit(null) == Column(Literal(null, NullType)))
+  }
+
   test("typedLit") {
+    assert(typedLit($"foo") == $"foo")
+    assert(typedLit('foo) == $"foo")
+    assert(typedLit(1) == Column(Literal(1)))
+    assert(typedLit[String](null) == Column(Literal(null, StringType)))
+
     val df = Seq(Tuple1(0)).toDF("a")
     // Only check the types `lit` cannot handle
     checkAnswer(

From f288b9f3c4b0eb70d34f241c6a215afa0a8db355 Mon Sep 17 00:00:00 2001
From: Shixiong Zhu <zsxwing@gmail.com>
Date: Tue, 14 Dec 2021 16:17:49 -0800
Subject: [PATCH 2/3] typedLit -> typedlit in comment

---
 sql/core/src/main/scala/org/apache/spark/sql/functions.scala | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/sql/core/src/main/scala/org/apache/spark/sql/functions.scala b/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
index cda9e895b106..d79335ba0cc9 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
@@ -117,7 +117,7 @@ object functions {
     case c: Column => c
     case s: Symbol => new ColumnName(s.name)
     case _ =>
-      // This is different from `typedLit`. `typedLit` calls `Literal.create` to use
+      // This is different from `typedlit`. `typedlit` calls `Literal.create` to use
       // `ScalaReflection` to get the type of `literal`. However, since we use `Any` in this method,
       // `typedLit[Any](literal)` will always fail and fallback to `Literal.apply`. Hence, we can
       // just manually call `Literal.apply` to skip the expensive `ScalaReflection` code. This is
@@ -144,7 +144,7 @@ object functions {
    * The difference between this function and [[lit]] is that this function
    * can handle parameterized scala types e.g.: List, Seq and Map.
    *
-   * Note: `typedLit` will call expensive Scala reflection APIs. `lit` is preferred if parameterized
+   * Note: `typedlit` will call expensive Scala reflection APIs. `lit` is preferred if parameterized
    * scala types are not used.
    *
    * @group normal_funcs

From d287a4abba7ea125f3eb13a55e6d6b53a467b111 Mon Sep 17 00:00:00 2001
From: Shixiong Zhu <shixiong@databricks.com>
Date: Tue, 14 Dec 2021 16:49:28 -0800
Subject: [PATCH 3/3] Use @note tag and capitalize Scala in typedlit Scaladoc

Co-authored-by: Hyukjin Kwon <gurwls223@gmail.com>
---
 sql/core/src/main/scala/org/apache/spark/sql/functions.scala | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/sql/core/src/main/scala/org/apache/spark/sql/functions.scala b/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
index d79335ba0cc9..ec28d8dde38e 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/functions.scala
@@ -144,8 +144,8 @@ object functions {
    * The difference between this function and [[lit]] is that this function
    * can handle parameterized scala types e.g.: List, Seq and Map.
    *
-   * Note: `typedlit` will call expensive Scala reflection APIs. `lit` is preferred if parameterized
-   * scala types are not used.
+   * @note `typedlit` will call expensive Scala reflection APIs. `lit` is preferred if parameterized
+   * Scala types are not used.
    *
    * @group normal_funcs
    * @since 3.2.0