Skip to content

Instantly share code, notes, and snippets.

View yamaguchiyuto's full-sized avatar

Yuto Yamaguchi yamaguchiyuto

View GitHub Profile
@yamaguchiyuto
yamaguchiyuto / predict.py
Created February 23, 2016 23:51
Reproducing TransE experiments [NIPS'13]
import sys
import pickle
import numpy as np
import pandas as pd
from transe import TRANSE
modelfilepath = sys.argv[1]
h = sys.argv[2]
r = sys.argv[3]
import numpy as np
from scipy import linalg,sparse,random
class RESCAL:
# Constructor: stores the three arguments on the instance unchanged.
# NOTE(review): r is presumably the latent rank and lamb_A / lamb_R the
# regularization weights used by fit() -- confirm against the full source,
# since the body of fit() is not visible here.
def __init__(self,r,lamb_A,lamb_R):
self.r = r
self.lamb_A = lamb_A
self.lamb_R = lamb_R
def fit(self,X,niter=30):
@yamaguchiyuto
yamaguchiyuto / remove_usernames_and_urls.py
Last active October 9, 2015 00:50
Removing URLs and usernames in tweets
import re
def remove_usernames_and_urls(text):
    """Return *text* with @usernames and http/https/ftp URLs removed.

    Usernames are stripped first, then URLs. Each match is replaced with
    the empty string, so whitespace that surrounded a removed token is
    left in place.
    """
    # Raw strings keep the regex escapes out of Python's string-literal
    # parsing; a plain literal containing '\w' is an invalid escape
    # sequence and triggers a warning on current Python versions.
    username_removed_text = re.sub(r'@\w+', '', text)  # remove usernames
    return re.sub(
        r"(https?|ftp)(://[-_.!~*'()a-zA-Z0-9;/?:@&=+$,%#]+)",
        '',
        username_removed_text,
    )  # remove urls
@yamaguchiyuto
yamaguchiyuto / cross_validation.py
Created December 5, 2014 04:06
Cross validation for oreore regression
import sys
import numpy as np
from sklearn import cross_validation
from oreore_ridge import RidgeRegression
def psi(xlist,M):
""" make a design matrix """
ret = []
for x in xlist:
ret.append([x**i for i in range(0,M+1)])
@yamaguchiyuto
yamaguchiyuto / grid_search.py
Created December 5, 2014 04:06
Grid search for oreore regression
import sys
import numpy as np
import matplotlib.pyplot as plt
from sklearn import grid_search
from oreore_ridge import RidgeRegression
def psi(xlist,M):
""" make a design matrix """
ret = []
for x in xlist:
@yamaguchiyuto
yamaguchiyuto / oreore_ridge.py
Created December 5, 2014 04:04
scikit-learn-compatible Ridge Regression
import numpy as np
from sklearn.base import BaseEstimator, RegressorMixin
class RidgeRegression(BaseEstimator, RegressorMixin):
# Constructor: stores lamb (default 1.0) on the instance.
# fit() multiplies self.lamb by the identity matrix that it adds to X^T X.
def __init__(self,lamb=1.0):
self.lamb = lamb
def fit(self,X,y):
A = np.dot(X.T,X) + self.lamb * np.identity(X.shape[1])
b = np.dot(X.T,y)
@yamaguchiyuto
yamaguchiyuto / get_precisions.py
Created December 2, 2014 15:32
LP and LS experiments
import sys
import numpy as np
import random
from sklearn import datasets
from sklearn.semi_supervised import label_propagation
from sklearn import svm
from sklearn.grid_search import ParameterGrid
def score(estimator, X, y, parameters, validation_true_labels, test_true_labels, validation_set, test_set, X_validation_for_svm=None, X_test_for_svm=None):
@yamaguchiyuto
yamaguchiyuto / digits.py
Created December 2, 2014 14:30
scikit-learn digits dataset
import matplotlib.pyplot as plt
from sklearn.datasets import load_digits
# Load the scikit-learn digits dataset and display its first image.
digits = load_digits()
# Switch the default colormap to grayscale before drawing.
plt.gray()
# Draw the first entry of digits.images as a matrix plot.
plt.matshow(digits.images[0])
plt.show()
@yamaguchiyuto
yamaguchiyuto / eigenspoke.py
Last active August 29, 2015 14:08
Plot EE-plot from edgelist [Aditya+, ICDM09]
import sys
import networkx as nx
from scipy.sparse import linalg
import matplotlib
matplotlib.use('Agg')
import matplotlib.pyplot as plt
def plot(v,name,k,n=10000):
for i in range(0,k-1):
plt.plot(v[:n,i],v[:n,i+1],'r+')
@yamaguchiyuto
yamaguchiyuto / basic_plot.py
Last active March 7, 2022 15:51
Plot degree distribution (Freq, CDF, CCDF) from edgelist data
import sys
import numpy as np
import networkx as nx
import matplotlib.pyplot as plt
def plot(data,filename,degreetype):
""" Plot Distribution """
plt.plot(range(len(data)),data,'bo')
plt.yscale('log')
plt.xscale('log')