# File viewer metadata: Python, 19 lines, 599 B
from pyspark.sql import SparkSession

# Bootstrap script: ensures the `marketing` database and its `ad_clicks`
# table exist. Both statements use IF NOT EXISTS, so an already-present
# database or table is left as it is.

# NOTE(review): the application name is an empty string in the original;
# consider a descriptive name so the job is identifiable in the Spark UI.
spark = SparkSession.builder.appName("").getOrCreate()

print("creating database")
spark.sql('CREATE DATABASE IF NOT EXISTS marketing')

print("creating table")
# NOTE(review): `USING iceberg` presumably requires the session to be
# configured with an Iceberg-capable catalog — confirm against the
# deployment's Spark configuration.
spark.sql('''
CREATE TABLE IF NOT EXISTS marketing.ad_clicks (
    user_id INT,
    ad_id INT,
    click_timestamp TIMESTAMP,
    impression_timestamp TIMESTAMP
)
USING iceberg
PARTITIONED BY (ad_id)
''')