Created
August 26, 2019 15:41
-
-
Save SimonCoulombe/9bd079070d37cbe8fabf8d8bb4a90c4d to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Titanic data wrangling adapted from https://rstudio-pubs-static.s3.amazonaws.com/324727_11ac0b6dbc77464da7b9de8c0f347463.html
# IMPORTANT: Only objectives 'binary:logistic', 'reg:linear', 'reg:logistic', 'binary:logitraw' are supported so far.
# Packages ----
# (Trailing "| |" table residue removed: it made these statements unparseable.)
library(titanic)      # data
library(tidypredict)  # convert model to sql string
library(dummies)
library(dplyr)
library(dbplyr)
library(magrittr)
library(xgboost)

# Load the train and test data sets into the workspace.
data("titanic_train")
data("titanic_test")
# Stack the train and test rows so that both go through the same preprocessing.
complete_data <- dplyr::bind_rows(titanic_train, titanic_test)

# Count of NAs per column
colSums(is.na(complete_data))

# Count of empty strings per column. na.rm = TRUE so that a column that also
# contains NAs still reports its empty-string count instead of NA.
colSums(complete_data == "", na.rm = TRUE)

# Number of unique values per column (vapply guarantees an integer vector)
vapply(complete_data, function(x) length(unique(x)), integer(1))
## Missing values imputation
# Empty Embarked values are set to "S"; missing ages get the median age.
complete_data$Embarked[complete_data$Embarked == ""] <- "S"
complete_data$Age[is.na(complete_data$Age)] <-
  median(complete_data$Age, na.rm = TRUE)

## Removing Cabin as it has very high missing values; PassengerId, Ticket and
## Name are not required
titanic_data <- complete_data %>%
  select(-c(Cabin, PassengerId, Ticket, Name))

## Converting "Pclass", "Sex", "Embarked" to factors
categorical_vars <- c("Pclass", "Sex", "Embarked")
titanic_data[categorical_vars] <-
  lapply(titanic_data[categorical_vars], as.factor)

## Create dummy variables for categorical variables
## (columns are named <variable>_<level> because of sep = "_")
titanic_data <- dummy.data.frame(
  titanic_data,
  names = categorical_vars,
  sep = "_"
)
# Name of the label column; every other column of titanic_data is a feature.
label_var <- "Survived"
feature_vars <- setdiff(colnames(titanic_data), label_var)

# Split back into train and test: the first nrow(titanic_train) rows of
# titanic_data are the training rows, the remaining rows are the test rows.
#
# The previous test index, `nrow(titanic_train)+1:nrow(titanic_data)`, parsed
# as n + (1:N) because `:` binds tighter than `+`; it indexed past the end of
# the data and produced all-NA rows. A logical mask avoids the precedence trap
# and also behaves correctly when either part is empty.
n_train <- nrow(titanic_train)
is_train_row <- seq_len(nrow(titanic_data)) <= n_train
train <- titanic_data[is_train_row, ]
test <- titanic_data[!is_train_row, ]
# Build the xgboost training matrix from the feature columns of `train`,
# labelled with the `label_var` column.
train_xgbmatrix <- xgb.DMatrix(
  # Explicit character-vector indexing: no ambiguity between a column literally
  # named "feature_vars" and the external vector of column names.
  data = as.matrix(train[, feature_vars, drop = FALSE]),
  label = train[[label_var]],
  # `missing` is a numeric sentinel, not a string; NA treats NA cells as missing.
  missing = NA
)
# Booster parameters. All names use the underscore spelling (`max_depth`
# rather than the `max.depth` alias) so the list is internally consistent.
param <- list(
  max_depth = 6,
  eta = 0.01,
  gamma = 0,
  subsample = 0.8,
  min_child_weight = 3,
  colsample_bytree = 0.8,
  objective = "binary:logistic"
)

# Train for 10 boosting rounds on the training matrix.
full_model <- xgb.train(
  params = param,
  data = train_xgbmatrix,
  nrounds = 10
)

# Translate the fitted model into a SQL expression, using a simulated
# PostgreSQL connection for the SQL dialect.
sql_code <- tidypredict_sql(full_model, dbplyr::simulate_postgres())
# | |
# > sql_code | |
# <SQL> 1.0 - 1.0 / (1.0 + EXP(0.0 + CASE | |
# WHEN ((`Age` < 6.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00434782589) | |
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0169444438) | |
# WHEN ((`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.015030303) | |
# WHEN (`Fare` >= 22.90415 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0130434781) | |
# WHEN ((`Fare` < 27.1353989 OR ((`Fare`) IS NULL)) AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00200000009) | |
# WHEN (`Age` >= 28.5 AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00333333341) | |
# WHEN (`Fare` >= 15.3729 AND (`Age` < 28.5 OR ((`Age`) IS NULL)) AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0104761906) | |
# WHEN ((`Fare` < 31.1375008 OR ((`Fare`) IS NULL)) AND (`Fare` < 52.2770996 OR ((`Fare`) IS NULL)) AND `Fare` >= 27.1353989 AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00666666683) | |
# WHEN (`Fare` >= 31.1375008 AND (`Fare` < 52.2770996 OR ((`Fare`) IS NULL)) AND `Fare` >= 27.1353989 AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0137499999) | |
# WHEN ((`Fare` < 59.0875015 OR ((`Fare`) IS NULL)) AND `Fare` >= 52.2770996 AND `Fare` >= 27.1353989 AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00499999989) | |
# WHEN (`Fare` >= 59.0875015 AND `Fare` >= 52.2770996 AND `Fare` >= 27.1353989 AND `Fare` >= 26.2687492 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00699999975) | |
# WHEN ((`Fare` < 8.03960037 OR ((`Fare`) IS NULL)) AND (`Fare` < 15.3729 OR ((`Fare`) IS NULL)) AND (`Age` < 28.5 OR ((`Age`) IS NULL)) AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0088888891) | |
# WHEN (`Fare` >= 8.03960037 AND (`Fare` < 15.3729 OR ((`Fare`) IS NULL)) AND (`Age` < 28.5 OR ((`Age`) IS NULL)) AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00166666671) | |
# END + CASE | |
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0169169754) | |
# WHEN ((`Age` < 3.5 OR ((`Age`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00349617656) | |
# WHEN (`Age` >= 3.5 AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0152933113) | |
# WHEN ((`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00366668426) | |
# WHEN (`Embarked_Q` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00704338402) | |
# WHEN (`Age` >= 53.0 AND `Age` >= 27.5 AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0112415785) | |
# WHEN (`Embarked_C` >= 0.5 AND (`Embarked_Q` < 0.5 OR ((`Embarked_Q`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00473228516) | |
# WHEN ((`Age` < 30.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00992533937) | |
# WHEN (`Parch` >= 1.5 AND (`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_Q` < 0.5 OR ((`Embarked_Q`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0103086075) | |
# WHEN ((`Age` < 36.5 OR ((`Age`) IS NULL)) AND `Age` >= 30.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00670130365) | |
# WHEN (`Age` >= 36.5 AND `Age` >= 30.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Pclass_1` >= 0.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0039536613) | |
# WHEN ((`Age` < 29.0 OR ((`Age`) IS NULL)) AND (`Parch` < 1.5 OR ((`Parch`) IS NULL)) AND (`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_Q` < 0.5 OR ((`Embarked_Q`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0044792355) | |
# WHEN (`Age` >= 29.0 AND (`Parch` < 1.5 OR ((`Parch`) IS NULL)) AND (`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_Q` < 0.5 OR ((`Embarked_Q`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00102121115) | |
# END + CASE | |
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.017226452) | |
# WHEN ((`Fare` < 26.9500008 OR ((`Fare`) IS NULL)) AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.0111564742) | |
# WHEN (`Fare` >= 26.9500008 AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00104449317) | |
# WHEN ((`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0150618982) | |
# WHEN (`Fare` >= 22.90415 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0128734633) | |
# WHEN ((`Fare` < 26.7749996 OR ((`Fare`) IS NULL)) AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00201320695) | |
# WHEN ((`Fare` < 7.88749981 OR ((`Fare`) IS NULL)) AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00789490249) | |
# WHEN ((`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0121291038) | |
# WHEN ((`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Fare` >= 7.88749981 AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0104477014) | |
# WHEN ((`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0076236045) | |
# WHEN (`SibSp` >= 0.5 AND `Pclass_1` >= 0.5 AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00127887854) | |
# WHEN ((`Age` < 14.25 OR ((`Age`) IS NULL)) AND `Fare` >= 10.8249998 AND `Fare` >= 7.88749981 AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0105509097) | |
# WHEN (`Age` >= 14.25 AND `Fare` >= 10.8249998 AND `Fare` >= 7.88749981 AND (`Fare` < 22.90415 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00126365363) | |
# END + CASE | |
# WHEN ((`Age` < 6.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00711674197) | |
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0174564831) | |
# WHEN ((`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0147035634) | |
# WHEN ((`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00624701194) | |
# WHEN (`Age` >= 53.0 AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0114857405) | |
# WHEN ((`Age` < 20.5 OR ((`Age`) IS NULL)) AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00275264238) | |
# WHEN (`Age` >= 20.5 AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00474784104) | |
# WHEN ((`Age` < 30.5 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0122412276) | |
# WHEN (`Age` >= 30.5 AND `Age` >= 27.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00586984493) | |
# WHEN ((`Age` < 27.5 OR ((`Age`) IS NULL)) AND (`Age` < 31.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (4.02321457e-05) | |
# WHEN (`Age` >= 27.5 AND (`Age` < 31.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0105560161) | |
# WHEN ((`Age` < 37.5 OR ((`Age`) IS NULL)) AND `Age` >= 31.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00527896453) | |
# WHEN (`Age` >= 37.5 AND `Age` >= 31.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00574399857) | |
# END + CASE | |
# WHEN (`Pclass_1` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0174164735) | |
# WHEN ((`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Age` < 13.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.0142651545) | |
# WHEN (`SibSp` >= 2.5 AND (`Age` < 13.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0132637918) | |
# WHEN (`SibSp` >= 2.5 AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (-0.00925219525) | |
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0155283092) | |
# WHEN (`Embarked_C` >= 0.5 AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.010165615) | |
# WHEN (`Age` >= 53.0 AND `Pclass_1` >= 0.5 AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.012750349) | |
# WHEN ((`Age` < 8.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.015696073) | |
# WHEN ((`Age` < 31.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00611250801) | |
# WHEN ((`Age` < 18.5 OR ((`Age`) IS NULL)) AND `Age` >= 8.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.00150432985) | |
# WHEN ((`Age` < 37.5 OR ((`Age`) IS NULL)) AND `Age` >= 31.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00585781876) | |
# WHEN (`Age` >= 37.5 AND `Age` >= 31.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 13.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0043284446) | |
# WHEN ((`Age` < 36.5 OR ((`Age`) IS NULL)) AND `Age` >= 18.5 AND `Age` >= 8.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.00814614445) | |
# WHEN (`Age` >= 36.5 AND `Age` >= 18.5 AND `Age` >= 8.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.00257276115) | |
# END + CASE | |
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0172553938) | |
# WHEN ((`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND (`Fare` < 15.1729002 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0145200891) | |
# WHEN (`SibSp` >= 0.5 AND (`Fare` < 15.1729002 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00783024263) | |
# WHEN (`SibSp` >= 2.5 AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0150947757) | |
# WHEN (`Fare` >= 23.7000008 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0132566504) | |
# WHEN ((`Fare` < 26.1437492 OR ((`Fare`) IS NULL)) AND (`Parch` < 0.5 OR ((`Parch`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0149228703) | |
# WHEN ((`Fare` < 22.0125008 OR ((`Fare`) IS NULL)) AND `Parch` >= 0.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00344564347) | |
# WHEN ((`Fare` < 13.9354496 OR ((`Fare`) IS NULL)) AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00938407332) | |
# WHEN (`Fare` >= 13.9354496 AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.000752933323) | |
# WHEN (`Fare` >= 10.8249998 AND `Embarked_S` >= 0.5 AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00430147443) | |
# WHEN ((`Fare` < 27.1353989 OR ((`Fare`) IS NULL)) AND `Fare` >= 26.1437492 AND (`Parch` < 0.5 OR ((`Parch`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00325194863) | |
# WHEN (`Fare` >= 27.1353989 AND `Fare` >= 26.1437492 AND (`Parch` < 0.5 OR ((`Parch`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00651466195) | |
# WHEN ((`Fare` < 36.8770981 OR ((`Fare`) IS NULL)) AND `Fare` >= 22.0125008 AND `Parch` >= 0.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00787981879) | |
# WHEN (`Fare` >= 36.8770981 AND `Fare` >= 22.0125008 AND `Parch` >= 0.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 15.1729002 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00314199668) | |
# WHEN ((`Fare` < 7.98750019 OR ((`Fare`) IS NULL)) AND (`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Embarked_S` >= 0.5 AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-8.59395514e-05) | |
# WHEN (`Fare` >= 7.98750019 AND (`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Embarked_S` >= 0.5 AND (`Fare` < 23.7000008 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00657150801) | |
# END + CASE | |
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0165820513) | |
# WHEN ((`Age` < 16.5 OR ((`Age`) IS NULL)) AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00138106104) | |
# WHEN (`SibSp` >= 2.5 AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0157281347) | |
# WHEN (`Fare` >= 23.3500004 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0124043347) | |
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND `Age` >= 16.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0148912258) | |
# WHEN ((`Fare` < 7.5625 OR ((`Fare`) IS NULL)) AND `Embarked_C` >= 0.5 AND `Age` >= 16.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0130371349) | |
# WHEN (`Fare` >= 7.5625 AND `Embarked_C` >= 0.5 AND `Age` >= 16.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0025235021) | |
# WHEN (`SibSp` >= 0.5 AND (`Age` < 36.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00371552329) | |
# WHEN (`SibSp` >= 0.5 AND `Age` >= 36.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00234823627) | |
# WHEN ((`Fare` < 8.00835037 OR ((`Fare`) IS NULL)) AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0103895292) | |
# WHEN (`Fare` >= 8.00835037 AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00343621452) | |
# WHEN (`Fare` >= 10.8249998 AND `Embarked_S` >= 0.5 AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00365704834) | |
# WHEN ((`Fare` < 30.5979004 OR ((`Fare`) IS NULL)) AND (`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND (`Age` < 36.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00683598779) | |
# WHEN (`Fare` >= 30.5979004 AND (`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND (`Age` < 36.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.000373432558) | |
# WHEN ((`Fare` < 31.6604004 OR ((`Fare`) IS NULL)) AND (`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Age` >= 36.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00503891986) | |
# WHEN (`Fare` >= 31.6604004 AND (`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Age` >= 36.5 AND (`SibSp` < 2.5 OR ((`SibSp`) IS NULL)) AND `Fare` >= 26.2687492 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0149384765) | |
# WHEN ((`Fare` < 7.98750019 OR ((`Fare`) IS NULL)) AND (`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Embarked_S` >= 0.5 AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00189721282) | |
# WHEN (`Fare` >= 7.98750019 AND (`Fare` < 10.8249998 OR ((`Fare`) IS NULL)) AND `Embarked_S` >= 0.5 AND (`Fare` < 23.3500004 OR ((`Fare`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0078471601) | |
# END + CASE | |
# WHEN ((`Age` < 6.5 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00661299704) | |
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0165493432) | |
# WHEN ((`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0141193997) | |
# WHEN (`Age` >= 53.0 AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0119009716) | |
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00629326282) | |
# WHEN (`Embarked_C` >= 0.5 AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00306293718) | |
# WHEN ((`Age` < 27.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00131507707) | |
# WHEN ((`Age` < 17.0 OR ((`Age`) IS NULL)) AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00376045983) | |
# WHEN (`Age` >= 17.0 AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-3.76139797e-05) | |
# WHEN ((`Age` < 29.5 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0130316792) | |
# WHEN (`Age` >= 29.5 AND `Age` >= 27.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00310476124) | |
# WHEN ((`Age` < 33.5 OR ((`Age`) IS NULL)) AND `Age` >= 27.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00891405623) | |
# WHEN (`Age` >= 33.5 AND `Age` >= 27.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Age` >= 6.5 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00187885517) | |
# END + CASE | |
# WHEN ((`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.015667025) | |
# WHEN ((`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.0144493645) | |
# WHEN (`SibSp` >= 1.5 AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0101849688) | |
# WHEN (`Pclass_3` >= 0.5 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0140106445) | |
# WHEN (`Pclass_2` >= 0.5 AND (`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0149726421) | |
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00812884886) | |
# WHEN (`Embarked_C` >= 0.5 AND (`Embarked_S` < 0.5 OR ((`Embarked_S`) IS NULL)) AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00324438047) | |
# WHEN (`SibSp` >= 1.5 AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.0134938397) | |
# WHEN (`Age` >= 53.0 AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.011087507) | |
# WHEN ((`Age` < 30.5 OR ((`Age`) IS NULL)) AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00593874184) | |
# WHEN (`Age` >= 30.5 AND (`Age` < 53.0 OR ((`Age`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_3` < 0.5 OR ((`Pclass_3`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0018952667) | |
# WHEN ((`Age` < 21.5 OR ((`Age`) IS NULL)) AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00219260831) | |
# WHEN (`Age` >= 21.5 AND (`Age` < 27.5 OR ((`Age`) IS NULL)) AND (`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.00342541724) | |
# WHEN ((`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Age` >= 27.5 AND (`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00868774112) | |
# WHEN (`SibSp` >= 0.5 AND `Age` >= 27.5 AND (`SibSp` < 1.5 OR ((`SibSp`) IS NULL)) AND `Embarked_S` >= 0.5 AND `Pclass_3` >= 0.5 AND `Sex_female` >= 0.5) THEN (-0.00330167799) | |
# END + CASE | |
# WHEN (`Pclass_1` >= 0.5 AND `Sex_female` >= 0.5) THEN (0.0160517655) | |
# WHEN ((`Fare` < 26.9500008 OR ((`Fare`) IS NULL)) AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.0104249204) | |
# WHEN (`Fare` >= 26.9500008 AND (`Age` < 13.0 OR ((`Age`) IS NULL)) AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00200724951) | |
# WHEN (`Pclass_2` >= 0.5 AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0152612738) | |
# WHEN ((`Embarked_C` < 0.5 OR ((`Embarked_C`) IS NULL)) AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0151267061) | |
# WHEN ((`Fare` < 26.7749996 OR ((`Fare`) IS NULL)) AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (0.00611572061) | |
# WHEN (`Fare` >= 20.7999992 AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (-0.0140776485) | |
# WHEN ((`Fare` < 8.6875 OR ((`Fare`) IS NULL)) AND `Embarked_C` >= 0.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.0112189986) | |
# WHEN (`Fare` >= 8.6875 AND `Embarked_C` >= 0.5 AND (`Fare` < 26.2687492 OR ((`Fare`) IS NULL)) AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00504898885) | |
# WHEN ((`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.011719726) | |
# WHEN ((`Age` < 16.5 OR ((`Age`) IS NULL)) AND (`Fare` < 20.7999992 OR ((`Fare`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.0101430472) | |
# WHEN ((`SibSp` < 0.5 OR ((`SibSp`) IS NULL)) AND `Pclass_1` >= 0.5 AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00742811617) | |
# WHEN (`SibSp` >= 0.5 AND `Pclass_1` >= 0.5 AND `Fare` >= 26.7749996 AND `Fare` >= 26.2687492 AND `Age` >= 13.0 AND (`Sex_female` < 0.5 OR ((`Sex_female`) IS NULL))) THEN (-0.00165399665) | |
# WHEN ((`Fare` < 7.88749981 OR ((`Fare`) IS NULL)) AND `Age` >= 16.5 AND (`Fare` < 20.7999992 OR ((`Fare`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (0.00621310156) | |
# WHEN (`Fare` >= 7.88749981 AND `Age` >= 16.5 AND (`Fare` < 20.7999992 OR ((`Fare`) IS NULL)) AND (`Pclass_2` < 0.5 OR ((`Pclass_2`) IS NULL)) AND (`Pclass_1` < 0.5 OR ((`Pclass_1`) IS NULL)) AND `Sex_female` >= 0.5) THEN (-0.00261630863) | |
# END)) | |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment