Skip to content

Instantly share code, notes, and snippets.

@szilard
Created August 27, 2017 03:48
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save szilard/0f90286629368af33fafe75060d66d6b to your computer and use it in GitHub Desktop.
Save szilard/0f90286629368af33fafe75060d66d6b to your computer and use it in GitHub Desktop.
Minimal lightgbm example
library(data.table)
library(ROCR)
library(lightgbm)
set.seed(123)
d_train <- fread("/var/data/bm-ml/train-0.1m.csv")
d_test <- fread("/var/data/bm-ml/test.csv")
d_train_test <- rbind(d_train, d_test)
d_train_test_xtra <- lgb.prepare_rules(d_train_test)
d_train_test <- d_train_test_xtra$data
cols_cats <- setdiff(names(d_train_test_xtra$rules),"dep_delayed_15min")
n1 <- nrow(d_train)
n2 <- nrow(d_test)
p <- ncol(d_train)-1
X_train <- as.matrix(d_train_test[1:n1,1:p])
X_test <- as.matrix(d_train_test[(n1+1):(n1+n2),1:p])
dlgb_train <- lgb.Dataset(data = X_train, label = ifelse(d_train$dep_delayed_15min=='Y',1,0))
system.time({
md <- lgb.train(data = dlgb_train, objective = "binary",
nrounds = 100, num_leaves = 512, learning_rate = 0.1, categorical_feature = cols_cats)
})
system.time({
phat <- predict(md, data = X_test)
})
rocr_pred <- prediction(phat, d_test$dep_delayed_15min)
performance(rocr_pred, "auc")@y.values[[1]]
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment