patternproject/anti-join vs setdiff

## anti-join vs setdiff
# The main idea comes from this post:
# http://zevross.com/blog/2014/08/05/using-the-r-function-anti_join-to-find-unmatched-records/

# Setting up
df.1 <- data.frame(
  state = rep(1:3, each=2),
  country = rep(c("A","B"),3),
  vals = rnorm(6)
)

df.2 = df.1[c(1,3,4),]

# Anti Join on 1 Parameter
anti_join(df.1,df.2, by=c("state"))

#   state country       vals
#     3       A -0.1566940
#     3       B  0.5666763

# Anti Join on 2 Parameters
anti_join(df.1,df.2, by=c("state","country"))

# state country       vals
#     1       B -0.4089718
#     3       B  0.5666763
#     3       A -0.1566940

# Anti Join on 3 or All Parameters
anti_join(df.1,df.2, by=c("state","country","vals"))
# state country       vals
#     3       B  0.5666763
#     3       A -0.1566940
#     1       B -0.4089718

setdiff(df.1,df.2)
# state country       vals
#     1       B -0.4089718
#     3       B  0.5666763
#     3       A -0.1566940

# setdiff behavior is similar to anti-join with all parameters.
	# The main idea comes from this post:
	# http://zevross.com/blog/2014/08/05/using-the-r-function-anti_join-to-find-unmatched-records/

	# Setting up
	df.1 <- data.frame(
	state = rep(1:3, each=2),
	country = rep(c("A","B"),3),
	vals = rnorm(6)
	)

	df.2 = df.1[c(1,3,4),]

	# Anti Join on 1 Parameter
	anti_join(df.1,df.2, by=c("state"))

	# state country vals
	# 3 A -0.1566940
	# 3 B 0.5666763

	# Anti Join on 2 Parameters
	anti_join(df.1,df.2, by=c("state","country"))

	# state country vals
	# 1 B -0.4089718
	# 3 B 0.5666763
	# 3 A -0.1566940

	# Anti Join on 3 or All Parameters
	anti_join(df.1,df.2, by=c("state","country","vals"))
	# state country vals
	# 3 B 0.5666763
	# 3 A -0.1566940
	# 1 B -0.4089718

	setdiff(df.1,df.2)
	# state country vals
	# 1 B -0.4089718
	# 3 B 0.5666763
	# 3 A -0.1566940

	# setdiff behavior is similar to anti-join with all parameters.