Skip to content

Instantly share code, notes, and snippets.

from pyspark.sql import functions as F
from pyspark.sql.functions import pandas_udf, PandasUDFType
from pyspark.sql.types import *
import pandas as pd
# Load the trip-data CSV into a Spark DataFrame.
# NOTE(review): `spark` is not defined in the visible part of this file;
# presumably it is the SparkSession supplied by the shell/notebook — confirm.
df = (
    spark.read
    # Use the first line of the file as column names.
    .option("header", "true")
    # Let Spark infer column types from the data rather than reading
    # every column as a string.
    .option("inferSchema", "true")
    .csv("yellow_tripdata_2017-06.csv")
)