# fbrundu/fastcluster_to_k.py

## fastcluster_to_k.py
import fastcluster as fc
import pandas as pd
import scipy.cluster.hierarchy as sch

# Hierarchically cluster a labelled matrix with fastcluster, cut the
# resulting dendrogram into at most k flat clusters, and write the
# label -> cluster id Series to a tab-separated text file.

# define total number of clusters to obtain
k = 5

# define matrix path
mat_path = 'matrix.txt'

# load matrix (the first column of the file becomes the row index)
mat = pd.read_table(mat_path, index_col=0)

# clustering on columns?
# the cluster ids are attached to mat.index below, i.e. the rows are the
# clustered items, so transpose when the columns are what should be grouped
clust_columns = True
if clust_columns:
    mat = mat.T

# define fastcluster method and metric
method = 'complete'
metric = 'cosine'

# run fastcluster (builds the full linkage over all rows of mat)
clust_total = fc.linkage(mat, method=method, metric=metric)

# crop dendrogram to k
# criterion='maxclust' treats k as an upper bound on the number of flat
# clusters (see the scipy fcluster documentation)
clust = sch.fcluster(clust_total, k, criterion='maxclust')

# clust to pandas Series, labelled with the row labels that were clustered
clust = pd.Series(clust, index=mat.index)

# write output to file (tab-separated)
output_path = 'clust.txt'
clust.to_csv(output_path, sep='\t')