Dmitry Persiyanov persiyanov

## masked_matmul.py
import torch
import torch.autograd


class MaskedSpMatmul(torch.autograd.Function):
	CHUNK_SIZE = 10000

	@staticmethod
	def forward(ctx, a, b, mask):
		"""

## results.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                persiyanov
                / results.md
            
            
              Last active
              June 22, 2018 12:25
            
              
                Word2Vec benchmark without _job_producer with CythonLineSentence
              
          
    ----- MODEL "cython-linesentence-word2vec-window-05-workers-01-size-300" RESULTS -----
       * Vocab time: 126.159779072 sec.
       * Total epoch time: 1181.82512498 sec.
       * Processing speed: 144372.118509 words/sec
       * Avg CPU loads: 0.14, 0.35, 5.27, 94.53, 0.09, 0.23, 0.01, 0.02, 0.02, 0.02, 0.02, 0.01, 0.02, 0.02, 0.33, 0.02
       * Sum CPU load: 101.11282
----- MODEL "cython-linesentence-word2vec-window-05-workers-04-size-300" RESULTS -----
       * Vocab time: 126.206352949 sec.
       * Total epoch time: 305.442888975 sec.


## python_memmap.py
#!/usr/bin/env python
# -*- coding: utf-8 -*-
#
# Copyright (C) 2010 Radim Rehurek <radimrehurek@seznam.cz>
# Licensed under the GNU LGPL v2.1 - http://www.gnu.org/licenses/lgpl.html


"""Corpus in the Matrix Market format.

This code uses python's struct library to read/write binary data

## gan.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                persiyanov
                / gan.ipynb
            
            
              Created
              January 4, 2017 14:34
            
              
                MNIST GAN
              
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## gan.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                persiyanov
                / gan.ipynb
            
            
              Last active
              December 30, 2016 16:00
            
              
                Original GAN on MNIST
              
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## loadsavelasagne.py
# Write every parameter array of the network into a single .npz archive.
# The arrays are passed positionally and are read back below under the
# keys 'arr_0', 'arr_1', ...
np.savez('model.npz', *lasagne.layers.get_all_param_values(network))
#
# To restore: reopen the archive, collect the arrays by index, and push
# them back into the network's parameters.
with np.load('model.npz') as f:
    param_values = [f['arr_%d' % i] for i, _ in enumerate(f.files)]
lasagne.layers.set_all_param_values(network, param_values)

## frozenlake.py
import gym
import numpy as np

DISCOUNT = 1.0
STEP_REWARD = 0.0
LOSE_REWARD = 0.0
WIN_REWARD = 1.0

def avg_reward(env, s, a):
    avg_reward = 0

## BagOfWordsModel.py
import pandas as pd
from sklearn.feature_extraction.text import CountVectorizer
import logging


class BagOfWordsModel(object):
    OUT_FOLDER = 'out'

    def __init__(self, id_document_dict, max_features=None, max_df=1.0):
        """Builds bow model.

## Playing Atari with Deep Reinforcement Learning (OpenAI Gym).ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                persiyanov
                / Playing Atari with Deep Reinforcement Learning (OpenAI Gym).ipynb
            
            
              Created
              May 26, 2016 14:49
            
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## howto.md

      
              1 file
            
          
              6 forks
            
          
              4 comments
            
          
              21 stars
            
          
                persiyanov
                / howto.md
            
            
              Last active
              October 21, 2021 15:35
            
              
                How to get an Amazon EC2 instance and do machine learning on it. Jupyter 4.0.6 server and Python 2.7.
              
          
    Goal

We want to move computation to a more powerful machine.
We will set up Anaconda 4.0.0 and XGBoost 0.4 (which is tricky to install).
Preliminaries


Amazon AWS Educate gives $100 to MIPT students.
GitHub Students Pack additionally gives $15.

Let's start

AWS Console and launching EC2 Instance.
	import torch
	import torch.autograd


	class MaskedSpMatmul(torch.autograd.Function):
	CHUNK_SIZE = 10000

	@staticmethod
	def forward(ctx, a, b, mask):
	"""
	#!/usr/bin/env python
	# -- coding: utf-8 --
	#
	# Copyright (C) 2010 Radim Rehurek <radimrehurek@seznam.cz>
	# Licensed under the GNU LGPL v2.1 - http://www.gnu.org/licenses/lgpl.html


	"""Corpus in the Matrix Market format.

	This code uses python's struct library to read/write binary data
	# Optionally, you could now dump the network weights to a file like this:
	np.savez('model.npz', *lasagne.layers.get_all_param_values(network))
	#
	# And load them again later on like this:
	with np.load('model.npz') as f:
	param_values = [f['arr_%d' % i] for i in range(len(f.files))]
	lasagne.layers.set_all_param_values(network, param_values)
	import gym
	import numpy as np

	DISCOUNT = 1.0
	STEP_REWARD = 0.0
	LOSE_REWARD = 0.0
	WIN_REWARD = 1.0

	def avg_reward(env, s, a):
	avg_reward = 0
	import pandas as pd
	from sklearn.feature_extraction.text import CountVectorizer
	import logging


	class BagOfWordsModel(object):
	OUT_FOLDER = 'out'

	def __init__(self, id_document_dict, max_features=None, max_df=1.0):
	"""Builds bow model.