diff --git a/python/pyspark/sql/functions/builtin.py b/python/pyspark/sql/functions/builtin.py index 344ba8d009ac4..1bdd2dbd8f016 100644 --- a/python/pyspark/sql/functions/builtin.py +++ b/python/pyspark/sql/functions/builtin.py @@ -7305,36 +7305,36 @@ def lag(col: "ColumnOrName", offset: int = 1, default: Optional[Any] = None) -> | b| 2| +---+---+ >>> w = Window.partitionBy("c1").orderBy("c2") - >>> df.withColumn("previos_value", lag("c2").over(w)).show() - +---+---+-------------+ - | c1| c2|previos_value| - +---+---+-------------+ - | a| 1| NULL| - | a| 2| 1| - | a| 3| 2| - | b| 2| NULL| - | b| 8| 2| - +---+---+-------------+ - >>> df.withColumn("previos_value", lag("c2", 1, 0).over(w)).show() - +---+---+-------------+ - | c1| c2|previos_value| - +---+---+-------------+ - | a| 1| 0| - | a| 2| 1| - | a| 3| 2| - | b| 2| 0| - | b| 8| 2| - +---+---+-------------+ - >>> df.withColumn("previos_value", lag("c2", 2, -1).over(w)).show() - +---+---+-------------+ - | c1| c2|previos_value| - +---+---+-------------+ - | a| 1| -1| - | a| 2| -1| - | a| 3| 1| - | b| 2| -1| - | b| 8| -1| - +---+---+-------------+ + >>> df.withColumn("previous_value", lag("c2").over(w)).show() + +---+---+--------------+ + | c1| c2|previous_value| + +---+---+--------------+ + | a| 1| NULL| + | a| 2| 1| + | a| 3| 2| + | b| 2| NULL| + | b| 8| 2| + +---+---+--------------+ + >>> df.withColumn("previous_value", lag("c2", 1, 0).over(w)).show() + +---+---+--------------+ + | c1| c2|previous_value| + +---+---+--------------+ + | a| 1| 0| + | a| 2| 1| + | a| 3| 2| + | b| 2| 0| + | b| 8| 2| + +---+---+--------------+ + >>> df.withColumn("previous_value", lag("c2", 2, -1).over(w)).show() + +---+---+--------------+ + | c1| c2|previous_value| + +---+---+--------------+ + | a| 1| -1| + | a| 2| -1| + | a| 3| 1| + | b| 2| -1| + | b| 8| -1| + +---+---+--------------+ """ from pyspark.sql.classic.column import _to_java_column