# PySpark
# PySpark
# Sort results
# Ascending order on the `age` column.
df = df.orderBy(df["age"].asc())
# Descending order on the `age` column.
df = df.orderBy(df["age"].desc())
# String functions
# Assumes `df` is a DataFrame and `F` is `pyspark.sql.functions`
# (neither is defined in this snippet).

# Substring: first 10 characters of `id`. Column.substr is 1-based, so the
# start position is written as 1.
df = df.withColumn('short_id', df.id.substr(1, 10))

# Trim whitespace from both ends of `name`.
df = df.withColumn('name', F.trim(df.name))

# Left-pad `id` with '0' to a width of 4.
df = df.withColumn('id', F.lpad('id', 4, '0'))

# Concatenate columns; a literal separator must be wrapped in F.lit,
# otherwise the string would be interpreted as a column name.
df = df.withColumn(
    'full_name',
    F.concat('fname', F.lit(' '), 'lname'),
)

# Concatenate columns with a separator given as the first argument.
df = df.withColumn(
    'full_name',
    F.concat_ws('-', 'fname', 'lname'),
)

# Regex replace: `$1` in the replacement refers to the first capture group.
# The column is passed by name ('id'); a bare `id` would be the Python builtin.
df = df.withColumn('id', F.regexp_replace('id', r'0F1(.*)', '1F1-$1'))

# Regex extract: group index 0 returns the whole match.
df = df.withColumn('id', F.regexp_extract('id', r'[0-9]*', 0))