Yasuhiro Fujita muupan

## train_sac_optim.py
"""A training script of Soft Actor-Critic on OpenAI Gym Mujoco environments.

This script follows the settings of https://arxiv.org/abs/1812.05905 as much
as possible.
"""
import argparse
from distutils.version import LooseVersion
import functools
import logging
import sys

## get_krishna_probability_foundations.sh
#!/bin/sh

set -e

# Download all the pdfs
wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture1_set_theory.pdf
wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture2_Realanalysis.pdf
wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture3_cardinality.pdf
wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture4_probability_spaces.pdf
wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture5_properties%20of%20prob%20measures.pdf

## how_to_build_deepmind_lab_on_macos_mojave.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                muupan
                / how_to_build_deepmind_lab_on_macos_mojave.md
            
            
              Last active
              May 14, 2020 12:05
            
              
                How to build DeepMind Lab on macOS Mojave (as of 2019/02/01)
              
          
    How to build DeepMind Lab on macOS Mojave (as of 2019/02/01)


Clone the macos branch of https://github.com/deepmind/lab


Read https://github.com/deepmind/lab/blob/macos/README.md and install dependencies.


Edit WORKSPACE to correct the paths of glib_archive, sdl_system, and python_system.


For glib_archive and sdl_system, you need to specify their correct paths.


## dqn.prototxt
layers {
  name: "frames_input_layer"
  type: MEMORY_DATA
  top: "frames"
  top: "dummy1"
  memory_data_param {
    batch_size: 32
    channels: 4
    height: 84
    width: 84

## gdl-kif.vim
" A syntax file for Game Description Language (GDL) in Knowledge
" Interchange Format (KIF).
"
" Put this file in .vim/syntax/ and set the filetype to gdl-kif.
" Example:
" au BufRead,BufNewFile *.kif set filetype=gdl-kif

syntax region gdlKifLineComment start=+;+ end=+$+
syntax match gdlKifArrow '<='
syntax keyword gdlKifFactRelation base init true next

## sum_arrays.py
from timeit import default_timer as timer

import chainer
from chainer import cuda
from chainer import function
import chainer.functions as F
from chainer import utils
from chainer.utils import type_check
import cupy

## gist:6120294
<item>
<name>ESC/Control+[ to EISUU mode in Terminal/MacVim</name>
<appendix>Change ESC to ESC, ESC, JIS_EISUU</appendix>
<appendix>Change Control+[ to ESC, ESC, JIS_EISUU</appendix>
<identifier>private.app_terminal_esc_with_eisuu</identifier>
<only>TERMINAL, VI</only>
<inputsource_only>JAPANESE</inputsource_only>
<autogen>--KeyToKey-- KeyCode::ESCAPE, KeyCode::ESCAPE, KeyCode::ESCAPE, KeyCode::JIS_EISUU</autogen>
<autogen>--KeyToKey-- KeyCode::JIS_BRACKET_LEFT, VK_CONTROL, KeyCode::ESCAPE, KeyCode::ESCAPE, KeyCode::JIS_EISUU</autogen>
</item>

## gist:66b42e3a3f755b5c35d3419276c1008e
Guided Cost Learning: Deep Inverse Optimal Control via Policy Optimization
Doubly Robust Off-policy Value Evaluation for Reinforcement Learning
Dropout as a Bayesian Approximation: Representing Model Uncertainty in Deep Learning
Learning Simple Algorithms from Examples
Stability of Controllers for Gaussian Process Forward Models
Smooth Imitation Learning for Online Sequence Prediction
On the Analysis of Complex Backup Strategies in Monte Carlo Tree Search
Benchmarking Deep Reinforcement Learning for Continuous Control
Cumulative Prospect Theory Meets Reinforcement Learning: Prediction and Control
Why Most Decisions Are Easy in Tetris—And Perhaps in Other Sequential Decision Problems, As Well

## gale_shapley.py
"""
Gale-Shapley Algorithm
"""

import random

def shuffled(lst):
    """Return a shuffled copy of ``lst``, leaving ``lst`` itself untouched.

    The input is duplicated with a full slice, and the duplicate is then
    shuffled in place using the module-level ``random`` generator.
    """
    permuted = lst[:]
    random.shuffle(permuted)
    return permuted

## clean_downloads.sh
#!/bin/sh

dir="$HOME/Downloads"
cd $dir

files=`ls -1`

# Set IFS (Internal Field Separator)
# See http://linux.just4fun.biz/%E9%80%86%E5%BC%95%E3%81%8D%E3%82%B7%E3%82%A7%E3%83%AB%E3%82%B9%E3%82%AF%E3%83%AA%E3%83%97%E3%83%88/%E3%82%B9%E3%83%9A%E3%83%BC%E3%82%B9%E3%81%8C%E5%90%AB%E3%81%BE%E3%82%8C%E3%82%8B%E6%96%87%E5%AD%97%E5%88%97%E3%82%921%E8%A1%8C%E3%81%A8%E3%81%97%E3%81%A6%E6%89%B1%E3%81%86%E6%96%B9%E6%B3%95.html
IFS_BACKUP=$IFS
	"""A training script of Soft Actor-Critic on OpenAI Gym Mujoco environments.

	This script follows the settings of https://arxiv.org/abs/1812.05905 as much
	as possible.
	"""
	import argparse
	from distutils.version import LooseVersion
	import functools
	import logging
	import sys
	#!/bin/sh

	set -e

	# Download all the pdfs
	wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture1_set_theory.pdf
	wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture2_Realanalysis.pdf
	wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture3_cardinality.pdf
	wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture4_probability_spaces.pdf
	wget -nc http://www.ee.iitm.ac.in/~krishnaj/EE5110_files/notes/lecture5_properties%20of%20prob%20measures.pdf
	layers {
	name: "frames_input_layer"
	type: MEMORY_DATA
	top: "frames"
	top: "dummy1"
	memory_data_param {
	batch_size: 32
	channels: 4
	height: 84
	width: 84
	" A syntax file for Game Description Language (GDL) in Knowledge
	" Interchange Format (KIF).
	"
	" Put this file in .vim/syntax/ and set the filetype to gdl-kif.
	" Example:
	" au BufRead,BufNewFile *.kif set filetype=gdl-kif

	syntax region gdlKifLineComment start=+;+ end=+$+
	syntax match gdlKifArrow '<='
	syntax keyword gdlKifFactRelation base init true next
	from timeit import default_timer as timer

	import chainer
	from chainer import cuda
	from chainer import function
	import chainer.functions as F
	from chainer import utils
	from chainer.utils import type_check
	import cupy
	<item>
	<name>ESC/Control+[ to EISUU mode in Terminal/MacVim</name>
	<appendix>Change ESC to ESC, ESC, JIS_EISUU</appendix>
	<appendix>Change Control+[ to ESC, ESC, JIS_EISUU</appendix>
	<identifier>private.app_terminal_esc_with_eisuu</identifier>
	<only>TERMINAL, VI</only>
	<inputsource_only>JAPANESE</inputsource_only>
	<autogen>--KeyToKey-- KeyCode::ESCAPE, KeyCode::ESCAPE, KeyCode::ESCAPE, KeyCode::JIS_EISUU</autogen>
	<autogen>--KeyToKey-- KeyCode::JIS_BRACKET_LEFT, VK_CONTROL, KeyCode::ESCAPE, KeyCode::ESCAPE, KeyCode::JIS_EISUU</autogen>
	</item>
	Guided Cost Learning: Deep Inverse Optimal Control via Policy Optimization
	Doubly Robust Off-policy Value Evaluation for Reinforcement Learning
	Dropout as a Bayesian Approximation: Representing Model Uncertainty in Deep Learning
	Learning Simple Algorithms from Examples
	Stability of Controllers for Gaussian Process Forward Models
	Smooth Imitation Learning for Online Sequence Prediction
	On the Analysis of Complex Backup Strategies in Monte Carlo Tree Search
	Benchmarking Deep Reinforcement Learning for Continuous Control
	Cumulative Prospect Theory Meets Reinforcement Learning: Prediction and Control
	Why Most Decisions Are Easy in Tetris—And Perhaps in Other Sequential Decision Problems, As Well
	"""
	Gale-Shapley Algorithm
	"""

	import random

	def shuffled(lst):
	    """Return a shuffled copy of ``lst``, leaving ``lst`` itself untouched.

	    The input is duplicated with a full slice, and the duplicate is then
	    shuffled in place using the module-level ``random`` generator.
	    """
	    # The body must be indented beneath ``def``; at the same level as the
	    # header the function does not parse.
	    tmp = lst[:]
	    random.shuffle(tmp)
	    return tmp
	#!/bin/sh

	dir="$HOME/Downloads"
	cd $dir

	files=`ls -1`

	# Set IFS (Internal Field Separator)
	# See http://linux.just4fun.biz/%E9%80%86%E5%BC%95%E3%81%8D%E3%82%B7%E3%82%A7%E3%83%AB%E3%82%B9%E3%82%AF%E3%83%AA%E3%83%97%E3%83%88/%E3%82%B9%E3%83%9A%E3%83%BC%E3%82%B9%E3%81%8C%E5%90%AB%E3%81%BE%E3%82%8C%E3%82%8B%E6%96%87%E5%AD%97%E5%88%97%E3%82%921%E8%A1%8C%E3%81%A8%E3%81%97%E3%81%A6%E6%89%B1%E3%81%86%E6%96%B9%E6%B3%95.html
	IFS_BACKUP=$IFS