Skip to content

Instantly share code, notes, and snippets.

@MarcinMoskala
Created June 6, 2020 07:57
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save MarcinMoskala/5c65ca4c375bc1486c255bf2808a3a58 to your computer and use it in GitHub Desktop.
Save MarcinMoskala/5c65ca4c375bc1486c255bf2808a3a58 to your computer and use it in GitHub Desktop.
def add_day_month_year(df):
    """Add calendar columns derived from the ``"Date"`` column of *df*.

    The first 10 characters of every ``"Date"`` value are taken as the date
    text and split on ``"/"``; the pieces are read as month, day and year in
    that order (i.e. the text is assumed to start with ``MM/DD/YYYY``).

    Columns written (the frame is modified in place and also returned):
        day_of_month: integer, second ``/``-separated field.
        month: integer, first ``/``-separated field.
        year: integer, third ``/``-separated field.
        date: the 10-character date text itself.

    The numeric columns are stored as integers rather than text so that
    callers can compare them with numbers (e.g. ``df.year <= 2019``), which
    raises ``TypeError`` when the column holds strings.

    Raises:
        KeyError: if *df* has no ``"Date"`` column.
        ValueError: if a date component is not a valid integer.
        IndexError: if a date has fewer than three ``/``-separated fields.
    """
    dates = df["Date"].map(lambda stamp: stamp[:10])
    # Split each date once and reuse the pieces for all three columns.
    parts = dates.map(lambda text: text.split("/"))
    df["day_of_month"] = parts.map(lambda fields: int(fields[1]))
    df["month"] = parts.map(lambda fields: int(fields[0]))
    df["year"] = parts.map(lambda fields: int(fields[2]))
    df["date"] = dates
    return df
from pandas import read_csv
# Load the crime records and attach day/month/year columns parsed from "Date".
crimes_df = read_csv("CrimeData.csv")
crimes_df = add_day_month_year(crimes_df)

# Keep records up to and including 2019. Cast explicitly so the comparison
# against 2019 is numeric even if "year" holds text (str <= int raises
# TypeError in pandas).
crimes_df = crimes_df[crimes_df["year"].astype(int) <= 2019]
crimes_df = crimes_df[crimes_df["Primary Type"] == "BATTERY"]  # "THEFT", ...

# NOTE(review): days_df is not used in the visible part of the script;
# presumably it is consumed further on - kept so that code still finds it.
days_df = read_csv("DaysData.csv")

# Number of remaining crime records per year, as a two-column frame
# ("year", "crimes").
crimes_count_df = (
    crimes_df.groupby(["year"])
    .size()
    .to_frame("crimes")
    .reset_index()
)
print(crimes_count_df.to_string())
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment