Jovi jovianlin

## my_standardscalar.py
def normalize(train, test):
    """Standardize ``train`` and ``test`` using statistics of ``train`` only.

    Both inputs are shifted by the training mean and divided by the training
    standard deviation, so the test data is scaled with exactly the same
    parameters as the training data.

    Args:
        train: Training data; must provide ``mean()`` and ``std()`` and
            support arithmetic with their results (e.g. a NumPy array).
        test: Held-out data supporting the same arithmetic.

    Returns:
        A ``(train, test)`` tuple holding the standardized inputs.

    Note:
        There is no guard against a zero standard deviation in ``train``.
    """
    # Both statistics must come from the training set: taking the standard
    # deviation from ``test`` would leak test information into the scaling
    # and would not give ``train`` unit variance.
    mean, std = train.mean(), train.std()
    return (train - mean) / std, (test - mean) / std

## plot_decision_boundary.py
# Train the logistic regression classifier.
# LogisticRegressionCV is scikit-learn's logistic regression with built-in
# cross-validation; it is created here with its default settings.
clf = sklearn.linear_model.LogisticRegressionCV()
clf.fit(X, y)  # X and y are defined outside this snippet

# Plot the decision boundary.
# NOTE(review): plot_decision_boundary is not defined in this snippet; it
# presumably evaluates the given prediction function over a grid -- confirm.
plot_decision_boundary(lambda x: clf.predict(x))
plt.title("Logistic Regression")

## clustering_cosine_similarity_matrix.py
"""
### Problem Statement ###
Let's say you have a square matrix which consists of cosine similarities (values between 0 and 1).
This square matrix can be of any size.
You want to get clusters which maximize the values between elements in the cluster.
For example, for the following matrix:

  |  A  |  B  |  C  |  D
A | 1.0 | 0.1 | 0.6 |  0.4
B | 0.1 | 1.0 | 0.1 |  0.2

## fix_encoding.py
def fix_encoding(some_str):
    """Return ``some_str`` with every non-printable-ASCII character removed.

    Keeps only characters whose code point lies in the printable ASCII range
    0x20 (space) through 0x7E (``~``); control characters and all non-ASCII
    characters are dropped.

    Args:
        some_str: The text to clean.

    Returns:
        A new string containing only the printable ASCII characters of
        ``some_str``, in their original order.
    """
    # The upper bound is 0x7E ('~'), the last printable ASCII character.
    # A bound of 0x78 ('x') would silently strip 'y', 'z', '{', '|', '}'
    # and '~' from ordinary text.
    return ''.join(c for c in some_str if 0x20 <= ord(c) <= 0x7E)


## anaconda_tensorflow.txt
# ===================================================================================
# Many thanks to:
# https://uoa-eresearch.github.io/eresearch-cookbook/recipe/2014/11/20/conda/
#
# More info:
# https://www.continuum.io/blog/developer-blog/python-packages-and-environments-conda
# https://conda-forge.github.io/#about
# ===================================================================================

# conda info --env

## fibonacci.py
from functools import lru_cache

@lru_cache(maxsize=100)
def fibonacci(n):
  """Validate that ``n`` is a positive ``int``.

  Calls are memoized by ``lru_cache`` (at most 100 distinct arguments).

  NOTE(review): nothing is computed or returned after the validation in
  this excerpt, so a valid ``n`` yields ``None``.

  Raises:
    TypeError: if ``n`` is not exactly of type ``int``.
    ValueError: if ``n`` is smaller than 1.
  """
  message = "n must be a positive int"
  # Exact type match: subclasses of int such as bool are rejected as well.
  if type(n) is not int:
    raise TypeError(message)
  if n <= 0:
    raise ValueError(message)


## foo.py
def foo(s):
	if len(s) <= 0:
		return None
	else:
		output, curr_char, curr_count = '', '', 0
		for idx in range(0, len(s)):
			if s[idx] == curr_char:
				curr_count += 1
			else:
				output += curr_char + str(curr_count) if curr_count > 0 else curr_char

## mini_batch_learning.py
from sklearn.linear_model import SGDRegressor

# https://adventuresindatascience.wordpress.com/2014/12/30/minibatch-learning-for-large-scale-data-using-scikit-learn/

def iter_minibatches(chunksize, numtrainingpoints):
    # Provide chunks one by one
    chunkstartmarker = 0
    while chunkstartmarker < numtrainingpoints:
        chunkrows = range(chunkstartmarker,chunkstartmarker+chunksize)
        X_chunk, y_chunk = getrows(chunkrows)

## TargetedSentimentAnalysis.py
# -*- coding: utf-8 -*-

from afinn import Afinn
import spacy
import re


class TargetedSentimentAnalysis(object):
	"""Holds an ``Afinn`` scorer (``self.afinn``) created with ``emoticons=True``.

	NOTE(review): only the constructor is visible in this excerpt.
	"""

	def __init__(self):
		# Afinn instance constructed with the emoticons option switched on.
		self.afinn = Afinn(emoticons=True)

## test_argparse.py
import argparse
import sys

def main():
    parser = argparse.ArgumentParser()
    parser.add_argument('--x', type=float, default=1.0,
                        help='What is the first number?')
    parser.add_argument('--y', type=float, default=1.0,
                        help='What is the second number?')
    parser.add_argument('--operation', type=str, default='add',
	def normalize(train, test):
		"""Standardize ``train`` and ``test`` using statistics of ``train`` only.

		Both inputs are shifted by the training mean and divided by the
		training standard deviation, so the test data is scaled with exactly
		the same parameters as the training data.

		Args:
			train: Training data; must provide ``mean()`` and ``std()`` and
				support arithmetic with their results (e.g. a NumPy array).
			test: Held-out data supporting the same arithmetic.

		Returns:
			A ``(train, test)`` tuple holding the standardized inputs.
		"""
		# Both statistics must come from the training set: taking the
		# standard deviation from ``test`` would leak test information and
		# would not give ``train`` unit variance.
		mean, std = train.mean(), train.std()
		return (train - mean) / std, (test - mean) / std
	# Train the logistic regression classifier
	clf = sklearn.linear_model.LogisticRegressionCV()
	clf.fit(X, y)

	# Plot the decision boundary
	plot_decision_boundary(lambda x: clf.predict(x))
	plt.title("Logistic Regression")
	"""
	### Problem Statement ###
	Let's say you have a square matrix which consists of cosine similarities (values between 0 and 1).
	This square matrix can be of any size.
	You want to get clusters which maximize the values between elements in the cluster.
	For example, for the following matrix:

	  |  A  |  B  |  C  |  D
	A | 1.0 | 0.1 | 0.6 |  0.4
	B | 0.1 | 1.0 | 0.1 |  0.2
	def fix_encoding(some_str):
		"""Return ``some_str`` with every non-printable-ASCII character removed.

		Keeps only characters whose code point lies in the printable ASCII
		range 0x20 (space) through 0x7E (``~``); control characters and all
		non-ASCII characters are dropped.

		Args:
			some_str: The text to clean.

		Returns:
			A new string containing only the printable ASCII characters of
			``some_str``, in their original order.
		"""
		# The upper bound is 0x7E ('~'), the last printable ASCII character.
		# A bound of 0x78 ('x') would silently strip 'y', 'z', '{', '|', '}'
		# and '~' from ordinary text.
		return ''.join(c for c in some_str if 0x20 <= ord(c) <= 0x7E)
	# ===================================================================================
	# Many thanks to:
	# https://uoa-eresearch.github.io/eresearch-cookbook/recipe/2014/11/20/conda/
	#
	# More info:
	# https://www.continuum.io/blog/developer-blog/python-packages-and-environments-conda
	# https://conda-forge.github.io/#about
	# ===================================================================================

	# conda info --env
	from functools import lru_cache

	@lru_cache(maxsize=100)
	def fibonacci(n):
		"""Validate that ``n`` is a positive ``int``.

		Calls are memoized by ``lru_cache`` (at most 100 distinct arguments).

		NOTE(review): nothing is computed or returned after the validation
		in this excerpt, so a valid ``n`` yields ``None``.

		Raises:
			TypeError: if ``n`` is not exactly of type ``int``.
			ValueError: if ``n`` is smaller than 1.
		"""
		# Check that the input is a positive integer. The exact type match
		# rejects subclasses of int such as bool as well.
		if type(n) is not int:
			raise TypeError("n must be a positive int")
		if n < 1:
			raise ValueError("n must be a positive int")
	def foo(s):
	if len(s) <= 0:
	return None
	else:
	output, curr_char, curr_count = '', '', 0
	for idx in range(0, len(s)):
	if s[idx] == curr_char:
	curr_count += 1
	else:
	output += curr_char + str(curr_count) if curr_count > 0 else curr_char
	from sklearn.linear_model import SGDRegressor

	# https://adventuresindatascience.wordpress.com/2014/12/30/minibatch-learning-for-large-scale-data-using-scikit-learn/

	def iter_minibatches(chunksize, numtrainingpoints):
	# Provide chunks one by one
	chunkstartmarker = 0
	while chunkstartmarker < numtrainingpoints:
	chunkrows = range(chunkstartmarker,chunkstartmarker+chunksize)
	X_chunk, y_chunk = getrows(chunkrows)
	# -*- coding: utf-8 -*-

	from afinn import Afinn
	import spacy
	import re


	class TargetedSentimentAnalysis(object):
	def __init__(self):
	self.afinn = Afinn(emoticons=True)
	import argparse
	import sys

	def main():
	parser = argparse.ArgumentParser()
	parser.add_argument('--x', type=float, default=1.0,
	help='What is the first number?')
	parser.add_argument('--y', type=float, default=1.0,
	help='What is the second number?')
	parser.add_argument('--operation', type=str, default='add',