Skip to content

Instantly share code, notes, and snippets.

View larkz's full-sized avatar
🤖

Larkin Liu larkz

🤖
View GitHub Profile
@larkz
larkz / test_gist.txt
Created October 10, 2021 10:49
test gist
This is a test 123!
@larkz
larkz / sandwellCustomerSegmentation.scala
Created June 13, 2016 17:44
User wallet and customer age segmentation
// String constant; not referenced anywhere in the lines visible here.
val num = "27"

// Load the measurement records from the parquet base directory.
val measurementData = sqlContext.read.parquet("/workspace/midgar/prod/ws/measurements/base")

// Keep only rows whose dateday is strictly after 2016-05-31 and strictly before 2016-06-10.
val mData = measurementData
  .filter($"dateday" > "2016-05-31")
  .filter($"dateday" < "2016-06-10")

// Project the measurement rows down to the columns listed below.
val mDataSubset = {
  val keptColumns = Seq(
    "customer_id",
    "channel",
    "group",
    "impression",
    "view",
    "click",
    "path_event_type",
    "dateday"
  )
  mData.select(keptColumns.head, keptColumns.tail: _*)
}

// Read the sales order snapshot table.
// A date filter is left disabled here, kept for reference:
//   .filter($"created_at" < "2016-04-01" || $"created_at" > "2016-03-01")
// NOTE(review): with `||` that condition would accept every non-null created_at;
// `&&` was probably intended -- confirm before re-enabling.
val salesOrderData = sqlContext.table("marketplace.sales_order_snapshot")

// Drop orders whose title contains "Recharge" or "Bill Payment".
val salesOrderData2 = salesOrderData.filter(
  !$"title".contains("Recharge") && !$"title".contains("Bill Payment")
)
@larkz
larkz / boltonFeatureGeneration.scala
Created June 13, 2016 02:45
Bolton Measurement Summary
// String constant; not referenced anywhere in the lines visible here.
val num = "27"

// Load the measurement records from the parquet base directory.
val measurementData = sqlContext.read.parquet("/workspace/midgar/prod/ws/measurements/base")

// Keep only rows whose dateday is strictly after 2016-05-31 and strictly before 2016-06-10.
val mData = measurementData
  .filter($"dateday" > "2016-05-31")
  .filter($"dateday" < "2016-06-10")

// Project the measurement rows down to the columns listed below.
val mDataSubset = {
  val keptColumns = Seq(
    "customer_id",
    "channel",
    "group",
    "impression",
    "view",
    "click",
    "path_event_type",
    "dateday"
  )
  mData.select(keptColumns.head, keptColumns.tail: _*)
}

// Read the sales order snapshot table.
// A date filter is left disabled here, kept for reference:
//   .filter($"created_at" < "2016-04-01" || $"created_at" > "2016-03-01")
// NOTE(review): with `||` that condition would accept every non-null created_at;
// `&&` was probably intended -- confirm before re-enabling.
val salesOrderData = sqlContext.table("marketplace.sales_order_snapshot")

// Drop orders whose title contains "Recharge" or "Bill Payment".
val salesOrderData2 = salesOrderData.filter(
  !$"title".contains("Recharge") && !$"title".contains("Bill Payment")
)
@larkz
larkz / .sql
Last active September 2, 2015 02:38
Hive query to union Parquet tables and select an attribute
create external table larkin_workspace.afp_flat_2015_08_19
(
created_at string,
title string,
customer_id bigint,
email string,
phone string,
remote_ip string,
subtotal int,
order_discount int,