Example of using NLTK's agreement package to calculate agreement scores for an annotation task
#
# Author: Cody Buntain
# Date: 19 March 2020
#
# Description:
# This code is an example of using the agreement package
# in NLTK to calculate a number of agreement metrics on
# a set of annotations. As written, this code works with
# two annotators and multiple labels.
# You can use Fleiss's Kappa or Krippendorff's Alpha if you
# have more than two annotators.
import pandas as pd
from nltk.metrics import agreement
# Assume this CSV has the format <tweet_id>,<label>
anno1_df = pd.read_csv("annotator_1.csv", header=None, index_col=0)
anno1_df.columns = ["label_a1"]
# Assume this CSV has the format <tweet_id>,<label>
anno2_df = pd.read_csv("annotator_2.csv", header=None, index_col=0)
anno2_df.columns = ["label_a2"]
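# As a purely hypothetical illustration (these tweet IDs and labels are
# made up, not from any real dataset), annotator_1.csv might look like:
#
#   1240811504232819712,High
#   1240811504232819713,Low
#   1240811504232819714,Critical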
# Join so we have a data frame of labels for each tweet ID
merged_df = anno1_df.join(anno2_df)
# We can drop rows where we don't have labels from both annotators.
# I think Krippendorff's Alpha can account for missing data, though, so this
# step isn't strictly necessary if you only care about Krippendorff's Alpha.
labels_matched_df = merged_df.dropna()
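# A hedged aside: if you want to keep items that only one annotator labeled
# (e.g. when relying on Krippendorff's Alpha), you could instead build the
# tuple list from merged_df and skip the missing labels per annotator.
# A minimal sketch (not executed here):
#
#   sparse_data = []
#   for idx, row in merged_df.iterrows():
#       if pd.notna(row["label_a1"]):
#           sparse_data.append(("a1", idx, row["label_a1"]))
#       if pd.notna(row["label_a2"]):
#           sparse_data.append(("a2", idx, row["label_a2"]))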
# Reformat the data into the (coder, item, label) tuples
# that AnnotationTask expects.
data = []
for idx, row in labels_matched_df.iterrows():
data.append(("a1", idx, row["label_a1"]))
data.append(("a2", idx, row["label_a2"]))
atask = agreement.AnnotationTask(data=data)
print("Cohen's Kappa:", atask.kappa())
print("Fleiss's Kappa:", atask.multi_kappa())
# This distance function maps labels into a numeric space,
# so we can take the ordering of the labels into account.
def priority_distance(left_label, right_label):
    mapped_labels = {
        "Critical": 4,
        "High": 3,
        "Medium": 2,
        "Low": 1,
    }
    left_i = mapped_labels[left_label]
    right_i = mapped_labels[right_label]
    return abs(left_i - right_i)
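# For example, priority_distance("Critical", "Low") == 3, while
# priority_distance("High", "Medium") == 1, so disagreements between
# adjacent priorities are penalized less than distant ones.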
# Create a new annotation task with the distance function
atask_2 = agreement.AnnotationTask(data=data, distance=priority_distance)
print("Krippendorf's Alpha:", atask_2.alpha())