@@ -1454,8 +1454,7 @@ def regexp_like(
14541454 >>> df = ctx.from_pydict({"a": ["hello123"]})
14551455 >>> result = df.select(
14561456 ... dfn.functions.regexp_like(
1457- ... dfn.col("a"), dfn.lit("\\d+")
1458- ... ).alias("m")
1457+ ... dfn.col("a"), "\\d+").alias("m")
14591458 ... )
14601459 >>> result.collect_column("m")[0].as_py()
14611460 True
@@ -1464,8 +1463,8 @@ def regexp_like(
14641463
14651464 >>> result = df.select(
14661465 ... dfn.functions.regexp_like(
1467- ... dfn.col("a"), dfn.lit( "HELLO") ,
1468- ... flags=dfn.lit( "i") ,
1466+ ... dfn.col("a"), "HELLO",
1467+ ... flags="i",
14691468 ... ).alias("m")
14701469 ... )
14711470 >>> result.collect_column("m")[0].as_py()
@@ -1488,8 +1487,7 @@ def regexp_match(
14881487 >>> df = ctx.from_pydict({"a": ["hello 42 world"]})
14891488 >>> result = df.select(
14901489 ... dfn.functions.regexp_match(
1491- ... dfn.col("a"), dfn.lit("(\\d+)")
1492- ... ).alias("m")
1490+ ... dfn.col("a"), "(\\d+)").alias("m")
14931491 ... )
14941492 >>> result.collect_column("m")[0].as_py()
14951493 ['42']
@@ -1498,8 +1496,8 @@ def regexp_match(
14981496
14991497 >>> result = df.select(
15001498 ... dfn.functions.regexp_match(
1501- ... dfn.col("a"), dfn.lit( "(HELLO)") ,
1502- ... flags=dfn.lit( "i") ,
1499+ ... dfn.col("a"), "(HELLO)",
1500+ ... flags="i",
15031501 ... ).alias("m")
15041502 ... )
15051503 >>> result.collect_column("m")[0].as_py()
@@ -1528,8 +1526,8 @@ def regexp_replace(
15281526 >>> df = ctx.from_pydict({"a": ["hello 42"]})
15291527 >>> result = df.select(
15301528 ... dfn.functions.regexp_replace(
1531- ... dfn.col("a"), dfn.lit( "\\d+") ,
1532- ... dfn.lit( "XX")
1529+ ... dfn.col("a"), "\\d+",
1530+ ... "XX"
15331531 ... ).alias("r")
15341532 ... )
15351533 >>> result.collect_column("r")[0].as_py()
@@ -1540,8 +1538,8 @@ def regexp_replace(
15401538 >>> df = ctx.from_pydict({"a": ["a1 b2 c3"]})
15411539 >>> result = df.select(
15421540 ... dfn.functions.regexp_replace(
1543- ... dfn.col("a"), dfn.lit( "\\d+") ,
1544- ... dfn.lit( "X") , flags=dfn.lit( "g") ,
1541+ ... dfn.col("a"), "\\d+",
1542+ ... "X", flags="g",
15451543 ... ).alias("r")
15461544 ... )
15471545 >>> result.collect_column("r")[0].as_py()
@@ -1556,7 +1554,7 @@ def regexp_replace(
15561554def regexp_count (
15571555 string : Expr ,
15581556 pattern : Expr | str ,
1559- start : Expr | str | None = None ,
1557+ start : Expr | int | None = None ,
15601558 flags : Expr | str | None = None ,
15611559) -> Expr :
15621560 """Returns the number of matches in a string.
@@ -1569,8 +1567,7 @@ def regexp_count(
15691567 >>> df = ctx.from_pydict({"a": ["abcabc"]})
15701568 >>> result = df.select(
15711569 ... dfn.functions.regexp_count(
1572- ... dfn.col("a"), dfn.lit("abc")
1573- ... ).alias("c"))
1570+ ... dfn.col("a"), "abc").alias("c"))
15741571 >>> result.collect_column("c")[0].as_py()
15751572 2
15761573
@@ -1579,8 +1576,8 @@ def regexp_count(
15791576
15801577 >>> result = df.select(
15811578 ... dfn.functions.regexp_count(
1582- ... dfn.col("a"), dfn.lit( "ABC") ,
1583- ... start=dfn.lit(4) , flags=dfn.lit( "i") ,
1579+ ... dfn.col("a"), "ABC",
1580+ ... start=4 , flags="i",
15841581 ... ).alias("c"))
15851582 >>> result.collect_column("c")[0].as_py()
15861583 1
@@ -1595,10 +1592,10 @@ def regexp_count(
15951592def regexp_instr (
15961593 values : Expr ,
15971594 regex : Expr | str ,
1598- start : Expr | str | None = None ,
1599- n : Expr | str | None = None ,
1595+ start : Expr | int | None = None ,
1596+ n : Expr | int | None = None ,
16001597 flags : Expr | str | None = None ,
1601- sub_expr : Expr | str | None = None ,
1598+ sub_expr : Expr | int | None = None ,
16021599) -> Expr :
16031600 r"""Returns the position of a regular expression match in a string.
16041601
@@ -1615,8 +1612,7 @@ def regexp_instr(
16151612 >>> df = ctx.from_pydict({"a": ["hello 42 world"]})
16161613 >>> result = df.select(
16171614 ... dfn.functions.regexp_instr(
1618- ... dfn.col("a"), dfn.lit("\\d+")
1619- ... ).alias("pos")
1615+ ... dfn.col("a"), "\\d+").alias("pos")
16201616 ... )
16211617 >>> result.collect_column("pos")[0].as_py()
16221618 7
@@ -1627,9 +1623,9 @@ def regexp_instr(
16271623 >>> df = ctx.from_pydict({"a": ["abc ABC abc"]})
16281624 >>> result = df.select(
16291625 ... dfn.functions.regexp_instr(
1630- ... dfn.col("a"), dfn.lit( "abc") ,
1631- ... start=dfn.lit(2) , n=dfn.lit(1) ,
1632- ... flags=dfn.lit( "i") ,
1626+ ... dfn.col("a"), "abc",
1627+ ... start=2 , n=1 ,
1628+ ... flags="i",
16331629 ... ).alias("pos")
16341630 ... )
16351631 >>> result.collect_column("pos")[0].as_py()
@@ -1639,8 +1635,8 @@ def regexp_instr(
16391635
16401636 >>> result = df.select(
16411637 ... dfn.functions.regexp_instr(
1642- ... dfn.col("a"), dfn.lit( "(abc)") ,
1643- ... sub_expr=dfn.lit(1) ,
1638+ ... dfn.col("a"), "(abc)",
1639+ ... sub_expr=1 ,
16441640 ... ).alias("pos")
16451641 ... )
16461642 >>> result.collect_column("pos")[0].as_py()
0 commit comments