Skip to content

Instantly share code, notes, and snippets.

@SimonCoulombe
Created August 26, 2019 15:41
Show Gist options
  • Save SimonCoulombe/9bd079070d37cbe8fabf8d8bb4a90c4d to your computer and use it in GitHub Desktop.
Save SimonCoulombe/9bd079070d37cbe8fabf8d8bb4a90c4d to your computer and use it in GitHub Desktop.
# titanic data wrangling from https://rstudio-pubs-static.s3.amazonaws.com/324727_11ac0b6dbc77464da7b9de8c0f347463.html
# IMPORTANT: Only the objectives 'binary:logistic', 'reg:linear', 'reg:logistic' and 'binary:logitraw' are supported so far.
library(titanic) # data
library(tidypredict) # convert model to sql string
library(dummies)
library(dplyr)
library(dbplyr)
library(magrittr)
library(xgboost)
# Load the train and test data sets from the titanic package and stack them
# into a single data frame so the cleaning steps below touch both at once.
data("titanic_train")
data("titanic_test")
complete_data <- dplyr::bind_rows(titanic_train, titanic_test)
# count of NA's
colSums(is.na(complete_data))
# count of empty strings; na.rm = TRUE is required because `NA == ""` is NA,
# which would otherwise turn the count of any column containing NA into NA
colSums(complete_data == "", na.rm = TRUE)
# number of unique values (vapply guarantees an integer vector result)
vapply(complete_data, function(x) length(unique(x)), integer(1))
## Missing values imputation
# Empty embarkation ports are replaced by "S"; missing ages by the median age.
complete_data$Embarked[complete_data$Embarked == ""] <- "S"
complete_data$Age[is.na(complete_data$Age)] <-
  median(complete_data$Age, na.rm = TRUE)
## Removing Cabin as it has very high missing values, passengerId, Ticket and Name are not required
titanic_data <- complete_data %>%
  select(-c(Cabin, PassengerId, Ticket, Name))
## Converting "Pclass", "Sex", "Embarked" to factors
# `[[` extracts the column as a vector regardless of the data frame flavour.
for (i in c("Pclass", "Sex", "Embarked")) {
  titanic_data[[i]] <- as.factor(titanic_data[[i]])
}
## One-hot encode the categorical columns; with sep = "_" the generated
## columns are named <variable>_<level> (e.g. Pclass_1, Sex_female).
titanic_data <- dummy.data.frame(
  titanic_data,
  names = c("Pclass", "Sex", "Embarked"),
  sep = "_"
)
# Name of the response column, and the names of every remaining column,
# which serve as the model features.
label_var <- "Survived"
feature_vars <- colnames(select(titanic_data, -one_of(label_var)))
# Split the stacked data back into its original parts: the first
# nrow(titanic_train) rows are the training set, the remainder the test set.
# seq_len() is used instead of `a + 1:b`, because `:` binds tighter than `+`
# and the latter would index past the end of the data and yield all-NA rows.
n_train <- nrow(titanic_train)
n_total <- nrow(titanic_data)
train <- titanic_data[seq_len(n_train), ]
test <- titanic_data[n_train + seq_len(n_total - n_train), ]
# Build the xgboost training matrix: the feature columns are converted to a
# matrix and the label column is supplied separately.
# `missing` must be a numeric sentinel; NA marks missing cells (the string
# "NAN" only worked through implicit coercion).
train_xgbmatrix <- xgb.DMatrix(
  data = as.matrix(train[, feature_vars, drop = FALSE]),
  label = train[[label_var]],
  missing = NA
)
# Booster settings handed to xgb.train() below.
param <- list(
  max.depth        = 6,
  eta              = 0.01,
  gamma            = 0,
  subsample        = 0.8,
  min_child_weight = 3,
  colsample_bytree = 0.8,
  objective        = "binary:logistic"
)
# Train the booster for 10 rounds on the training matrix using `param`.
full_model <- xgb.train(
  params = param,
  data = train_xgbmatrix,
  nrounds = 10
)
# Render the fitted model as a SQL expression against a simulated Postgres
# connection; an example of the result is reproduced in the comment below.
sql_code <- tidypredict_sql(
  model = full_model,
  con = dbplyr::simulate_postgres()
)
#
# > sql_code
# <SQL> 1.0 - 1.0 / (1.0 + EXP(0.0 + CASE
# WHEN ((`Age` < 6.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00434782589)
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0169444438)
# WHEN ((`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.015030303)
# WHEN (`Fare` >= 22.90415 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0130434781)
# WHEN ((`Fare` < 27.1353989 OR ((`Fare`) IS NULL)) AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00200000009)
# WHEN (`Age` >= 28.5 AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00333333341)
# WHEN (`Fare` >= 15.3729 AND (`Age` < 28.5 OR ((`Age`) IS NULL)) AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0104761906)
# WHEN ((`Fare` < 31.1375008 OR ((`Fare`) IS NULL)) AND (`Fare` < 52.2770996 OR ((`Fare`) IS NULL)) AND `Fare` >= 27.1353989 AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00666666683)
# WHEN (`Fare` >= 31.1375008 AND (`Fare` < 52.2770996 OR ((`Fare`) IS NULL)) AND `Fare` >= 27.1353989 AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0137499999)
# WHEN ((`Fare` < 59.0875015 OR ((`Fare`) IS NULL)) AND `Fare` >= 52.2770996 AND `Fare` >= 27.1353989 AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00499999989)
# WHEN (`Fare` >= 59.0875015 AND `Fare` >= 52.2770996 AND `Fare` >= 27.1353989 AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00699999975)
# WHEN ((`Fare` < 8.03960037 OR ((`Fare`) IS NULL)) AND (`Fare` < 15.3729 OR ((`Fare`) IS NULL)) AND (`Age` < 28.5 OR ((`Age`) IS NULL)) AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0088888891)
# WHEN (`Fare` >= 8.03960037 AND (`Fare` < 15.3729 OR ((`Fare`) IS NULL)) AND (`Age` < 28.5 OR ((`Age`) IS NULL)) AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00166666671)
# END + CASE
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0169169754)
# WHEN ((`Age` < 3.5 OR ((`Age`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00349617656)
# WHEN (`Age` >= 3.5 AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0152933113)
# WHEN ((`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00366668426)
# WHEN (`Embarked_Q` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00704338402)
# WHEN (`Age` >= 53.0 AND `Age` >= 27.5 AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0112415785)
# WHEN (`Embarked_C` >= 0.5 AND (`Embarked_Q` < 0.5 OR ((`Embarked_Q`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00473228516)
# WHEN ((`Age` < 30.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00992533937)
# WHEN (`Parch` >= 1.5 AND (`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_Q` < 0.5 OR ((`Embarked_Q`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0103086075)
# WHEN ((`Age` < 36.5 OR ((`Age`) IS NULL)) AND `Age` >= 30.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00670130365)
# WHEN (`Age` >= 36.5 AND `Age` >= 30.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0039536613)
# WHEN ((`Age` < 29.0 OR ((`Age`) IS NULL)) AND (`Parch` < 1.5 OR ((`Parch`) IS NULL)) AND (`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_Q` < 0.5 OR ((`Embarked_Q`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0044792355)
# WHEN (`Age` >= 29.0 AND (`Parch` < 1.5 OR ((`Parch`) IS NULL)) AND (`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_Q` < 0.5 OR ((`Embarked_Q`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00102121115)
# END + CASE
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.017226452)
# WHEN ((`Fare` < 26.9500008 OR ((`Fare`) IS NULL)) AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.0111564742)
# WHEN (`Fare` >= 26.9500008 AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00104449317)
# WHEN ((`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0150618982)
# WHEN (`Fare` >= 22.90415 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0128734633)
# WHEN ((`Fare` < 26.7749996 OR ((`Fare`) IS NULL)) AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00201320695)
# WHEN ((`Fare` < 7.88749981 OR ((`Fare`) IS NULL)) AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00789490249)
# WHEN ((`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0121291038)
# WHEN ((`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Fare` >= 7.88749981 AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0104477014)
# WHEN ((`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0076236045)
# WHEN (`SibSp` >= 0.5 AND `Pclass_1` >= 0.5 AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00127887854)
# WHEN ((`Age` < 14.25 OR ((`Age`) IS NULL)) AND `Fare` >= 10.8249998 AND `Fare` >= 7.88749981 AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0105509097)
# WHEN (`Age` >= 14.25 AND `Fare` >= 10.8249998 AND `Fare` >= 7.88749981 AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00126365363)
# END + CASE
# WHEN ((`Age` < 6.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00711674197)
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0174564831)
# WHEN ((`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0147035634)
# WHEN ((`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00624701194)
# WHEN (`Age` >= 53.0 AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0114857405)
# WHEN ((`Age` < 20.5 OR ((`Age`) IS NULL)) AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00275264238)
# WHEN (`Age` >= 20.5 AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00474784104)
# WHEN ((`Age` < 30.5 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0122412276)
# WHEN (`Age` >= 30.5 AND `Age` >= 27.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00586984493)
# WHEN ((`Age` < 27.5 OR ((`Age`) IS NULL)) AND (`Age` < 31.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (4.02321457e-05)
# WHEN (`Age` >= 27.5 AND (`Age` < 31.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0105560161)
# WHEN ((`Age` < 37.5 OR ((`Age`) IS NULL)) AND `Age` >= 31.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00527896453)
# WHEN (`Age` >= 37.5 AND `Age` >= 31.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00574399857)
# END + CASE
# WHEN (`Pclass_1` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0174164735)
# WHEN ((`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Age` < 13.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.0142651545)
# WHEN (`SibSp` >= 2.5 AND (`Age` < 13.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0132637918)
# WHEN (`SibSp` >= 2.5 AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (-0.00925219525)
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0155283092)
# WHEN (`Embarked_C` >= 0.5 AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.010165615)
# WHEN (`Age` >= 53.0 AND `Pclass_1` >= 0.5 AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.012750349)
# WHEN ((`Age` < 8.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.015696073)
# WHEN ((`Age` < 31.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00611250801)
# WHEN ((`Age` < 18.5 OR ((`Age`) IS NULL)) AND `Age` >= 8.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.00150432985)
# WHEN ((`Age` < 37.5 OR ((`Age`) IS NULL)) AND `Age` >= 31.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00585781876)
# WHEN (`Age` >= 37.5 AND `Age` >= 31.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0043284446)
# WHEN ((`Age` < 36.5 OR ((`Age`) IS NULL)) AND `Age` >= 18.5 AND `Age` >= 8.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.00814614445)
# WHEN (`Age` >= 36.5 AND `Age` >= 18.5 AND `Age` >= 8.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.00257276115)
# END + CASE
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0172553938)
# WHEN ((`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND (`Fare` < 15.1729002 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0145200891)
# WHEN (`SibSp` >= 0.5 AND (`Fare` < 15.1729002 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00783024263)
# WHEN (`SibSp` >= 2.5 AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0150947757)
# WHEN (`Fare` >= 23.7000008 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0132566504)
# WHEN ((`Fare` < 26.1437492 OR ((`Fare`) IS NULL)) AND (`Parch` < 0.5 OR ((`Parch`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0149228703)
# WHEN ((`Fare` < 22.0125008 OR ((`Fare`) IS NULL)) AND `Parch` >= 0.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00344564347)
# WHEN ((`Fare` < 13.9354496 OR ((`Fare`) IS NULL)) AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00938407332)
# WHEN (`Fare` >= 13.9354496 AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.000752933323)
# WHEN (`Fare` >= 10.8249998 AND `Embarked_S` >= 0.5 AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00430147443)
# WHEN ((`Fare` < 27.1353989 OR ((`Fare`) IS NULL)) AND `Fare` >= 26.1437492 AND (`Parch` < 0.5 OR ((`Parch`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00325194863)
# WHEN (`Fare` >= 27.1353989 AND `Fare` >= 26.1437492 AND (`Parch` < 0.5 OR ((`Parch`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00651466195)
# WHEN ((`Fare` < 36.8770981 OR ((`Fare`) IS NULL)) AND `Fare` >= 22.0125008 AND `Parch` >= 0.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00787981879)
# WHEN (`Fare` >= 36.8770981 AND `Fare` >= 22.0125008 AND `Parch` >= 0.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00314199668)
# WHEN ((`Fare` < 7.98750019 OR ((`Fare`) IS NULL)) AND (`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Embarked_S` >= 0.5 AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-8.59395514e-05)
# WHEN (`Fare` >= 7.98750019 AND (`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Embarked_S` >= 0.5 AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00657150801)
# END + CASE
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0165820513)
# WHEN ((`Age` < 16.5 OR ((`Age`) IS NULL)) AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00138106104)
# WHEN (`SibSp` >= 2.5 AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0157281347)
# WHEN (`Fare` >= 23.3500004 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0124043347)
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND `Age` >= 16.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0148912258)
# WHEN ((`Fare` < 7.5625 OR ((`Fare`) IS NULL)) AND `Embarked_C` >= 0.5 AND `Age` >= 16.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0130371349)
# WHEN (`Fare` >= 7.5625 AND `Embarked_C` >= 0.5 AND `Age` >= 16.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0025235021)
# WHEN (`SibSp` >= 0.5 AND (`Age` < 36.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00371552329)
# WHEN (`SibSp` >= 0.5 AND `Age` >= 36.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00234823627)
# WHEN ((`Fare` < 8.00835037 OR ((`Fare`) IS NULL)) AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0103895292)
# WHEN (`Fare` >= 8.00835037 AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00343621452)
# WHEN (`Fare` >= 10.8249998 AND `Embarked_S` >= 0.5 AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00365704834)
# WHEN ((`Fare` < 30.5979004 OR ((`Fare`) IS NULL)) AND (`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND (`Age` < 36.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00683598779)
# WHEN (`Fare` >= 30.5979004 AND (`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND (`Age` < 36.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.000373432558)
# WHEN ((`Fare` < 31.6604004 OR ((`Fare`) IS NULL)) AND (`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Age` >= 36.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00503891986)
# WHEN (`Fare` >= 31.6604004 AND (`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Age` >= 36.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0149384765)
# WHEN ((`Fare` < 7.98750019 OR ((`Fare`) IS NULL)) AND (`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Embarked_S` >= 0.5 AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00189721282)
# WHEN (`Fare` >= 7.98750019 AND (`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Embarked_S` >= 0.5 AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0078471601)
# END + CASE
# WHEN ((`Age` < 6.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00661299704)
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0165493432)
# WHEN ((`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0141193997)
# WHEN (`Age` >= 53.0 AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0119009716)
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00629326282)
# WHEN (`Embarked_C` >= 0.5 AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00306293718)
# WHEN ((`Age` < 27.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00131507707)
# WHEN ((`Age` < 17.0 OR ((`Age`) IS NULL)) AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00376045983)
# WHEN (`Age` >= 17.0 AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-3.76139797e-05)
# WHEN ((`Age` < 29.5 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0130316792)
# WHEN (`Age` >= 29.5 AND `Age` >= 27.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00310476124)
# WHEN ((`Age` < 33.5 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00891405623)
# WHEN (`Age` >= 33.5 AND `Age` >= 27.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00187885517)
# END + CASE
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.015667025)
# WHEN ((`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.0144493645)
# WHEN (`SibSp` >= 1.5 AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0101849688)
# WHEN (`Pclass_3` >= 0.5 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0140106445)
# WHEN (`Pclass_2` >= 0.5 AND (`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0149726421)
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00812884886)
# WHEN (`Embarked_C` >= 0.5 AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00324438047)
# WHEN (`SibSp` >= 1.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0134938397)
# WHEN (`Age` >= 53.0 AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.011087507)
# WHEN ((`Age` < 30.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00593874184)
# WHEN (`Age` >= 30.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0018952667)
# WHEN ((`Age` < 21.5 OR ((`Age`) IS NULL)) AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00219260831)
# WHEN (`Age` >= 21.5 AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00342541724)
# WHEN ((`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Age` >= 27.5 AND (`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00868774112)
# WHEN (`SibSp` >= 0.5 AND `Age` >= 27.5 AND (`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00330167799)
# END + CASE
# WHEN (`Pclass_1` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0160517655)
# WHEN ((`Fare` < 26.9500008 OR ((`Fare`) IS NULL)) AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.0104249204)
# WHEN (`Fare` >= 26.9500008 AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00200724951)
# WHEN (`Pclass_2` >= 0.5 AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0152612738)
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0151267061)
# WHEN ((`Fare` < 26.7749996 OR ((`Fare`) IS NULL)) AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00611572061)
# WHEN (`Fare` >= 20.7999992 AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (-0.0140776485)
# WHEN ((`Fare` < 8.6875 OR ((`Fare`) IS NULL)) AND `Embarked_C` >= 0.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0112189986)
# WHEN (`Fare` >= 8.6875 AND `Embarked_C` >= 0.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00504898885)
# WHEN ((`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.011719726)
# WHEN ((`Age` < 16.5 OR ((`Age`) IS NULL)) AND (`Fare` < 20.7999992 OR ((`Fare`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0101430472)
# WHEN ((`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00742811617)
# WHEN (`SibSp` >= 0.5 AND `Pclass_1` >= 0.5 AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00165399665)
# WHEN ((`Fare` < 7.88749981 OR ((`Fare`) IS NULL)) AND `Age` >= 16.5 AND (`Fare` < 20.7999992 OR ((`Fare`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.00621310156)
# WHEN (`Fare` >= 7.88749981 AND `Age` >= 16.5 AND (`Fare` < 20.7999992 OR ((`Fare`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (-0.00261630863)
# END))
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment