Skip to content

Instantly share code, notes, and snippets.

View tdpetrou's full-sized avatar
💪

Ted Petrou tdpetrou

💪
View GitHub Profile
# Load the housing training data and build a two-column feature array.
import pandas as pd
# NOTE: read_csv is given a shortened URL, so this line needs network access
# every time the script runs.
housing = pd.read_csv('http://bit.ly/kagglehousingtrain')
# Columns selected from the DataFrame to form the feature matrix.
cols = ['GrLivArea', 'GarageArea']
# .values returns the selected columns as a NumPy array (labels are dropped).
X = housing[cols].values
from sklearn.preprocessing import StandardScaler
# KFold, cross_val_score and DecisionTreeRegressor are imported but not used
# in the lines visible here; presumably they are used further down -- TODO confirm.
from sklearn.model_selection import KFold, cross_val_score
from sklearn.tree import DecisionTreeRegressor
# The scaler is only instantiated here; it is not fitted or applied to X in
# the visible lines.
ss = StandardScaler()
@tdpetrou
tdpetrou / basictransformer.py
Last active September 7, 2023 13:44
A custom scikit-learn transformer for one-hot encoding categorical values and standardizing numeric columns
import pandas as pd
import numpy as np
from sklearn.base import BaseEstimator
class BasicTransformer(BaseEstimator):
def __init__(self, cat_threshold=None, num_strategy='median', return_df=False):
# store parameters as public attributes
self.cat_threshold = cat_threshold