from pyspark.sql import SparkSession
from pyspark.sql.functions import from_unixtime, unix_timestamp
# Initialize (or reuse) the Spark session for this example.
spark = SparkSession.builder.appName("date_format_conversion").getOrCreate()

# Example data: a US-style date whose month and day are NOT zero-padded.
data = [("3/6/2020",)]
df = spark.createDataFrame(data, ["date_string"])

# Convert the date string from month/day/year to ISO-style yyyy-MM-dd.
#
# The parse pattern is "M/d/yyyy" rather than "MM/dd/yyyy": since Spark 3.0
# the datetime parser is strict, so two-letter "MM"/"dd" require exactly two
# digits and "3/6/2020" fails to parse (SparkUpgradeException under the
# default spark.sql.legacy.timeParserPolicy, null when it is CORRECTED).
# Single-letter "M"/"d" accept both "3/6/2020" and "03/06/2020".
df_converted = df.withColumn(
    "formatted_date",
    from_unixtime(unix_timestamp("date_string", "M/d/yyyy"), "yyyy-MM-dd"),
)

# Print the original column next to the reformatted one.
df_converted.show()
Created February 26, 2024 21:31
Save dvu4/17faf74428944aa646d42bdc34968c01 to your computer and use it in GitHub Desktop.
Sign up for free to join this conversation on GitHub.
Already have an account? Sign in to comment.