Skip to content

Instantly share code, notes, and snippets.

@masterdezign
Created November 1, 2021 17:35
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save masterdezign/0bbd663be11d8901c179db0cd0dab3cf to your computer and use it in GitHub Desktop.
Save masterdezign/0bbd663be11d8901c179db0cd0dab3cf to your computer and use it in GitHub Desktop.
import pandas as pd
# .read_csv()
# .shape
# .head(N) .tail(N)
# .dtypes
# .loc[3, 'sepal_length'] .iloc
# .to_csv()
# pd.set_option('display.max_columns', 2)  # use the full key; bare 'max_columns' is ambiguous in pandas >= 1.4
# pd.options.display.float_format = '{:,.2f}'.format
# .isna()
# .cumsum(skipna=False)
# df['Profit'] = df.apply(lambda x:..., axis=1)
# df['Xx'].map()
# df.applymap(lambda x: len(str(x)))  # Applies the function to every element (DataFrame.map in pandas >= 2.1)
# .pivot .stack
# .plot()
# .plot.area(stacked=False)
# .boxplot()
# .describe()
# .corr()
# Packages
# - pandas_profiling (since renamed ydata-profiling; newer releases import from ydata_profiling)
# from pandas_profiling import ProfileReport
# profile = ProfileReport(df, title="Title")
# profile.to_notebook_iframe()
# Dask - parallel computing
# import dask.dataframe as dd
# df = dd.read_csv('...')
# Koalas -> pandas API on Apache Spark (bundled as pyspark.pandas since Spark 3.2)
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment