# What the SparkSession Does
from pyspark.sql import SparkSession
# Obtain the session object; every Spark call in this script is issued through it.
spark = (
    SparkSession.builder
    .appName('nordgrid-daily-pipeline')
    .getOrCreate()
)

# Each step below is reached via an attribute or method of `spark`.
df = spark.read.csv('bronze/meters/')  # load CSV input from this path
df.createOrReplaceTempView('meters')  # make `df` queryable from SQL as 'meters'
result = spark.sql('SELECT * FROM meters')  # execute a SQL statement against that view
spark.conf.get('spark.sql.shuffle.partitions')  # look up a config value (result is not stored)
print(type(spark))  # <class 'pyspark.sql.session.SparkSession'>








