Skip to content

Instantly share code, notes, and snippets.

@mirrornerror
Last active November 1, 2018 06:37
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save mirrornerror/c694b0316fc78868e730e7a4b5297c03 to your computer and use it in GitHub Desktop.
Save mirrornerror/c694b0316fc78868e730e7a4b5297c03 to your computer and use it in GitHub Desktop.
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# Kaggle: Titanic: Machine Learning from Disaster \n",
"### with EarlyStopping\n",
"https://www.kaggle.com/c/titanic"
]
},
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/mirrornerror/.pyenv/versions/anaconda3-5.1.0/envs/py36/lib/python3.6/site-packages/h5py/__init__.py:36: FutureWarning: Conversion of the second argument of issubdtype from `float` to `np.floating` is deprecated. In future, it will be treated as `np.float64 == np.dtype(float).type`.\n",
" from ._conv import register_converters as _register_converters\n",
"Using TensorFlow backend.\n"
]
}
],
"source": [
"import pandas as pd\n",
"import numpy as np\n",
"import matplotlib.pyplot as plt\n",
"%matplotlib inline\n",
"\n",
"# random seed\n",
"import tensorflow as tf\n",
"import random as rn\n",
"import os\n",
"os.environ['PYTHONHASHSEED'] = '0'\n",
"random_n = 123\n",
"np.random.seed(random_n)\n",
"rn.seed(random_n)\n",
"session_conf = tf.ConfigProto(intra_op_parallelism_threads=1, inter_op_parallelism_threads=1)\n",
"from keras import backend as K\n",
"tf.set_random_seed(random_n)\n",
"sess = tf.Session(graph=tf.get_default_graph(), config=session_conf)\n",
"K.set_session(sess)\n",
"\n",
"train = pd.read_csv('train.csv', index_col=0)\n",
"test = pd.read_csv('test.csv', index_col=0)"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Survived</th>\n",
" <th>Pclass</th>\n",
" <th>Name</th>\n",
" <th>Sex</th>\n",
" <th>Age</th>\n",
" <th>SibSp</th>\n",
" <th>Parch</th>\n",
" <th>Ticket</th>\n",
" <th>Fare</th>\n",
" <th>Cabin</th>\n",
" <th>Embarked</th>\n",
" </tr>\n",
" <tr>\n",
" <th>PassengerId</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>Braund, Mr. Owen Harris</td>\n",
" <td>male</td>\n",
" <td>22.0</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>A/5 21171</td>\n",
" <td>7.2500</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>Cumings, Mrs. John Bradley (Florence Briggs Th...</td>\n",
" <td>female</td>\n",
" <td>38.0</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>PC 17599</td>\n",
" <td>71.2833</td>\n",
" <td>C85</td>\n",
" <td>C</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>1</td>\n",
" <td>3</td>\n",
" <td>Heikkinen, Miss. Laina</td>\n",
" <td>female</td>\n",
" <td>26.0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>STON/O2. 3101282</td>\n",
" <td>7.9250</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>Futrelle, Mrs. Jacques Heath (Lily May Peel)</td>\n",
" <td>female</td>\n",
" <td>35.0</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>113803</td>\n",
" <td>53.1000</td>\n",
" <td>C123</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>Allen, Mr. William Henry</td>\n",
" <td>male</td>\n",
" <td>35.0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>373450</td>\n",
" <td>8.0500</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Survived Pclass \\\n",
"PassengerId \n",
"1 0 3 \n",
"2 1 1 \n",
"3 1 3 \n",
"4 1 1 \n",
"5 0 3 \n",
"\n",
" Name Sex Age \\\n",
"PassengerId \n",
"1 Braund, Mr. Owen Harris male 22.0 \n",
"2 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 \n",
"3 Heikkinen, Miss. Laina female 26.0 \n",
"4 Futrelle, Mrs. Jacques Heath (Lily May Peel) female 35.0 \n",
"5 Allen, Mr. William Henry male 35.0 \n",
"\n",
" SibSp Parch Ticket Fare Cabin Embarked \n",
"PassengerId \n",
"1 1 0 A/5 21171 7.2500 NaN S \n",
"2 1 0 PC 17599 71.2833 C85 C \n",
"3 0 0 STON/O2. 3101282 7.9250 NaN S \n",
"4 1 0 113803 53.1000 C123 S \n",
"5 0 0 373450 8.0500 NaN S "
]
},
"execution_count": 2,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"train.head()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Drop Survived and Ticket, then combine train with test "
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {
"scrolled": true
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"<class 'pandas.core.frame.DataFrame'>\n",
"Int64Index: 1309 entries, 1 to 1309\n",
"Data columns (total 9 columns):\n",
"Pclass 1309 non-null int64\n",
"Name 1309 non-null object\n",
"Sex 1309 non-null object\n",
"Age 1046 non-null float64\n",
"SibSp 1309 non-null int64\n",
"Parch 1309 non-null int64\n",
"Fare 1308 non-null float64\n",
"Cabin 295 non-null object\n",
"Embarked 1307 non-null object\n",
"dtypes: float64(2), int64(3), object(4)\n",
"memory usage: 102.3+ KB\n"
]
}
],
"source": [
"train_tmp = train.drop(['Survived', 'Ticket'], axis=1)\n",
"test_tmp = test.drop(['Ticket'], axis=1)\n",
"df = pd.concat([train_tmp, test_tmp])\n",
"df.info()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Name --> Title --> Number"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"['Mr' 'Mrs' 'Miss' 'Master' 'Don' 'Rev' 'Dr' 'Mme' 'Ms' 'Major' 'Lady'\n",
" 'Sir' 'Mlle' 'Col' 'Capt' 'Countess' 'Jonkheer' 'Dona']\n"
]
}
],
"source": [
"# Name to Title\n",
"df = df.assign(Title=df.Name.str.extract(' ([A-Za-z]+)\\..', expand=True))\n",
"title_list = df.Title.unique()\n",
"print(title_list)"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Pclass</th>\n",
" <th>Sex</th>\n",
" <th>Age</th>\n",
" <th>SibSp</th>\n",
" <th>Parch</th>\n",
" <th>Fare</th>\n",
" <th>Cabin</th>\n",
" <th>Embarked</th>\n",
" <th>Title</th>\n",
" </tr>\n",
" <tr>\n",
" <th>PassengerId</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>3</td>\n",
" <td>male</td>\n",
" <td>22.0</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>7.2500</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>1</td>\n",
" <td>female</td>\n",
" <td>38.0</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>71.2833</td>\n",
" <td>C85</td>\n",
" <td>C</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>3</td>\n",
" <td>female</td>\n",
" <td>26.0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>7.9250</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>1</td>\n",
" <td>female</td>\n",
" <td>35.0</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>53.1000</td>\n",
" <td>C123</td>\n",
" <td>S</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>3</td>\n",
" <td>male</td>\n",
" <td>35.0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>8.0500</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Pclass Sex Age SibSp Parch Fare Cabin Embarked Title\n",
"PassengerId \n",
"1 3 male 22.0 1 0 7.2500 NaN S 0\n",
"2 1 female 38.0 1 0 71.2833 C85 C 1\n",
"3 3 female 26.0 0 0 7.9250 NaN S 2\n",
"4 1 female 35.0 1 0 53.1000 C123 S 1\n",
"5 3 male 35.0 0 0 8.0500 NaN S 0"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Title to Number(0-17)\n",
"df.Title = df.Title.replace(df.Title.unique(), np.arange(len(df.Title.unique())))\n",
"\n",
"# Drop Name column\n",
"df = df.drop(['Name'], axis=1)\n",
"df.head()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Sex --> male:0, female:1"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {
"scrolled": true
},
"outputs": [],
"source": [
"df.Sex = df.Sex.replace({'male': 0, 'female': 1})"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Cabin --> Number: nan:0, C:1, E:2, G:3, D:4, A:5, B:6, F:7, T:8"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"[nan 'C' 'E' 'G' 'D' 'A' 'B' 'F' 'T']\n",
"[0 1 2 3 4 5 6 7 8]\n"
]
}
],
"source": [
"df = df.assign(Cabin=df.Cabin.str[0])\n",
"cabin_list = df.Cabin.unique()\n",
"\n",
"df.Cabin = df.Cabin.replace(df.Cabin.str[0].unique(), np.arange(len(df.Cabin.str[0].unique())))\n",
"\n",
"print(cabin_list)\n",
"print(df.Cabin.unique())"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Embarked --> S:0, C:1, Q:2, nan"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['S', 'C', 'Q', nan], dtype=object)"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df.Embarked.unique()"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [],
"source": [
"df.Embarked = df.Embarked.replace({'S':0, 'C':1, 'Q':2})"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## zscore or normalization: \n",
"* Age: including NaN\n",
"* Fare: including NaN \n",
" \n",
"Z = (x - x.mean) / x.std \n",
"N = (x - x.min) / (x.max - x.min) \n",
" \n",
"sklearn.preprocessing.MinMaxScaler causes error with Null data."
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [],
"source": [
"# Normalize Function\n",
"def normalize(df_col):\n",
" df_col = (df_col - df_col.min()) / (df_col.max() - df_col.min())\n",
" return df_col"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [],
"source": [
"# Standardization(zscore)\n",
"def zscore(df_col):\n",
" df_col = (df_col - df_col.mean()) / df_col.std()\n",
" return df_col"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Pclass</th>\n",
" <th>Sex</th>\n",
" <th>Age</th>\n",
" <th>SibSp</th>\n",
" <th>Parch</th>\n",
" <th>Fare</th>\n",
" <th>Cabin</th>\n",
" <th>Embarked</th>\n",
" <th>Title</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>count</th>\n",
" <td>1309.000000</td>\n",
" <td>1309.000000</td>\n",
" <td>1.046000e+03</td>\n",
" <td>1.309000e+03</td>\n",
" <td>1.309000e+03</td>\n",
" <td>1.308000e+03</td>\n",
" <td>1309.000000</td>\n",
" <td>1307.000000</td>\n",
" <td>1.309000e+03</td>\n",
" </tr>\n",
" <tr>\n",
" <th>mean</th>\n",
" <td>2.294882</td>\n",
" <td>0.355997</td>\n",
" <td>9.488904e-17</td>\n",
" <td>2.178887e-16</td>\n",
" <td>-5.920059e-17</td>\n",
" <td>-6.049357e-16</td>\n",
" <td>0.786860</td>\n",
" <td>0.394797</td>\n",
" <td>5.343319e-17</td>\n",
" </tr>\n",
" <tr>\n",
" <th>std</th>\n",
" <td>0.837836</td>\n",
" <td>0.478997</td>\n",
" <td>1.000000e+00</td>\n",
" <td>1.000000e+00</td>\n",
" <td>1.000000e+00</td>\n",
" <td>1.000000e+00</td>\n",
" <td>1.794388</td>\n",
" <td>0.653817</td>\n",
" <td>1.000000e+00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>min</th>\n",
" <td>1.000000</td>\n",
" <td>0.000000</td>\n",
" <td>-2.061342e+00</td>\n",
" <td>-4.789037e-01</td>\n",
" <td>-4.448295e-01</td>\n",
" <td>-6.432832e-01</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>-5.418264e-01</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25%</th>\n",
" <td>2.000000</td>\n",
" <td>0.000000</td>\n",
" <td>-6.161683e-01</td>\n",
" <td>-4.789037e-01</td>\n",
" <td>-4.448295e-01</td>\n",
" <td>-4.907329e-01</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>-5.418264e-01</td>\n",
" </tr>\n",
" <tr>\n",
" <th>50%</th>\n",
" <td>3.000000</td>\n",
" <td>0.000000</td>\n",
" <td>-1.305123e-01</td>\n",
" <td>-4.789037e-01</td>\n",
" <td>-4.448295e-01</td>\n",
" <td>-3.640217e-01</td>\n",
" <td>0.000000</td>\n",
" <td>0.000000</td>\n",
" <td>-5.418264e-01</td>\n",
" </tr>\n",
" <tr>\n",
" <th>75%</th>\n",
" <td>3.000000</td>\n",
" <td>1.000000</td>\n",
" <td>6.326615e-01</td>\n",
" <td>4.811039e-01</td>\n",
" <td>-4.448295e-01</td>\n",
" <td>-3.903654e-02</td>\n",
" <td>0.000000</td>\n",
" <td>1.000000</td>\n",
" <td>6.481916e-01</td>\n",
" </tr>\n",
" <tr>\n",
" <th>max</th>\n",
" <td>3.000000</td>\n",
" <td>1.000000</td>\n",
" <td>3.477218e+00</td>\n",
" <td>7.201157e+00</td>\n",
" <td>9.953060e+00</td>\n",
" <td>9.255140e+00</td>\n",
" <td>8.000000</td>\n",
" <td>2.000000</td>\n",
" <td>9.573327e+00</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Pclass Sex Age SibSp Parch \\\n",
"count 1309.000000 1309.000000 1.046000e+03 1.309000e+03 1.309000e+03 \n",
"mean 2.294882 0.355997 9.488904e-17 2.178887e-16 -5.920059e-17 \n",
"std 0.837836 0.478997 1.000000e+00 1.000000e+00 1.000000e+00 \n",
"min 1.000000 0.000000 -2.061342e+00 -4.789037e-01 -4.448295e-01 \n",
"25% 2.000000 0.000000 -6.161683e-01 -4.789037e-01 -4.448295e-01 \n",
"50% 3.000000 0.000000 -1.305123e-01 -4.789037e-01 -4.448295e-01 \n",
"75% 3.000000 1.000000 6.326615e-01 4.811039e-01 -4.448295e-01 \n",
"max 3.000000 1.000000 3.477218e+00 7.201157e+00 9.953060e+00 \n",
"\n",
" Fare Cabin Embarked Title \n",
"count 1.308000e+03 1309.000000 1307.000000 1.309000e+03 \n",
"mean -6.049357e-16 0.786860 0.394797 5.343319e-17 \n",
"std 1.000000e+00 1.794388 0.653817 1.000000e+00 \n",
"min -6.432832e-01 0.000000 0.000000 -5.418264e-01 \n",
"25% -4.907329e-01 0.000000 0.000000 -5.418264e-01 \n",
"50% -3.640217e-01 0.000000 0.000000 -5.418264e-01 \n",
"75% -3.903654e-02 0.000000 1.000000 6.481916e-01 \n",
"max 9.255140e+00 8.000000 2.000000 9.573327e+00 "
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df.Age = zscore(df.Age)\n",
"df.Fare = zscore(df.Fare)\n",
"df.SibSp = zscore(df.SibSp)\n",
"df.Parch = zscore(df.Parch)\n",
"df.Title = zscore(df.Title)\n",
"\n",
"# df.Age = normalize(df.Age)\n",
"# df.Fare = normalize(df.Fare)\n",
"\n",
"# for col in df.columns:\n",
"# df[col] = normalize(df[col])\n",
"\n",
"df.describe()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Split the Data into Null-data and Notnull-data\n",
"\n",
"Make a Copy of df: df0 = df.copy() \n",
"* Age\n",
"* Embarked\n",
"* Fare\n"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"<class 'pandas.core.frame.DataFrame'>\n",
"Int64Index: 1309 entries, 1 to 1309\n",
"Data columns (total 9 columns):\n",
"Pclass 1309 non-null int64\n",
"Sex 1309 non-null int64\n",
"Age 1046 non-null float64\n",
"SibSp 1309 non-null float64\n",
"Parch 1309 non-null float64\n",
"Fare 1308 non-null float64\n",
"Cabin 1309 non-null int64\n",
"Embarked 1307 non-null float64\n",
"Title 1309 non-null float64\n",
"dtypes: float64(6), int64(3)\n",
"memory usage: 102.3 KB\n"
]
}
],
"source": [
"# Drop Cabin if the result gets better\n",
"#df = df.drop(['Cabin'], axis=1)\n",
"\n",
"df0 = df.copy()\n",
"df0.info()"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {},
"outputs": [],
"source": [
"Age_null = df[df.Age.isnull()]\n",
"df = df[df.Age.notnull()]\n",
"\n",
"Embarked_null = df[df.Embarked.isnull()]\n",
"df = df[df.Embarked.notnull()]\n",
"\n",
"Fare_null = df[df.Fare.isnull()]\n",
"df = df[df.Fare.notnull()]"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Get Notnull Data: df.shape = (1043, 9)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"(1043, 9)\n",
"<class 'pandas.core.frame.DataFrame'>\n",
"Int64Index: 1043 entries, 1 to 1307\n",
"Data columns (total 9 columns):\n",
"Pclass 1043 non-null int64\n",
"Sex 1043 non-null int64\n",
"Age 1043 non-null float64\n",
"SibSp 1043 non-null float64\n",
"Parch 1043 non-null float64\n",
"Fare 1043 non-null float64\n",
"Cabin 1043 non-null int64\n",
"Embarked 1043 non-null float64\n",
"Title 1043 non-null float64\n",
"dtypes: float64(6), int64(3)\n",
"memory usage: 81.5 KB\n"
]
}
],
"source": [
"print(df.shape)\n",
"df.info()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Model to fill NaN in Fare, Embarked, Age"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {},
"outputs": [],
"source": [
"from keras.models import Sequential\n",
"from keras.layers import Flatten, Dense, Dropout, BatchNormalization\n",
"import keras\n",
"from keras.callbacks import EarlyStopping, ModelCheckpoint, ReduceLROnPlateau\n",
"\n",
"initializer = keras.initializers.glorot_uniform(seed=random_n)\n",
"# model for Fare, Embarked, Age\n",
"def fill_data(col):\n",
" n_cols = len(df.columns) - 1\n",
" num = len(df[col].unique())\n",
" \n",
" model = Sequential()\n",
" model.add(Dense(64, activation='relu', input_shape=(n_cols,), kernel_initializer=initializer))\n",
" model.add(Dropout(0.5, seed=random_n))\n",
" \n",
" if col == 'Embarked':\n",
" model.add(Dense(num, activation='softmax', kernel_initializer=initializer))\n",
" model.compile(optimizer='adam', loss='sparse_categorical_crossentropy', metrics=['acc'])\n",
" else: # 'Fare', 'Age'\n",
" model.add(Dense(1, activation='relu', kernel_initializer=initializer))\n",
" model.compile(optimizer='adam', loss='mse', metrics=['mae'])\n",
" \n",
" data = df.drop([col], axis=1)\n",
" \n",
" reduce_lr = ReduceLROnPlateau(monitor='val_loss', factor=0.2, patience=3, min_lr=0.000001,verbose=1)\n",
" checkpointer = ModelCheckpoint(filepath='checkpoint_'+col+'.hdf5', verbose=1, save_best_only=True)\n",
" early_stopping = EarlyStopping(patience=10, verbose=1)\n",
" epochs = 300\n",
" hist = model.fit(data, df[col], \n",
" epochs=epochs, \n",
" batch_size=32,\n",
" verbose=1,\n",
" validation_split=0.1,\n",
" callbacks=[reduce_lr, early_stopping, checkpointer])\n",
"\n",
" null_data = df0[df0[col].isnull()]\n",
" null_data = null_data.drop([col], axis=1)\n",
" \n",
" model.load_weights('checkpoint_'+col+'.hdf5')\n",
" pred = model.predict(null_data)\n",
" \n",
" if col == 'Embarked':\n",
" pred = pred.argmax(axis=1)\n",
" \n",
" plt.plot(hist.history['acc'], 'b-', label='acc' )\n",
" plt.plot(hist.history['loss'], 'r-', label='loss' )\n",
" plt.xlabel('epochs')\n",
" plt.legend()\n",
" plt.show()\n",
" \n",
" pred = pred.reshape(-1, )\n",
" \n",
" idx = df0[df0[col].isnull()].index.values\n",
"\n",
" for n, i in enumerate(idx):\n",
" df0.loc[i, col] = pred[n]"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {
"scrolled": true
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Train on 938 samples, validate on 105 samples\n",
"Epoch 1/300\n",
"938/938 [==============================] - 0s 344us/step - loss: 0.8662 - acc: 0.6205 - val_loss: 0.7452 - val_acc: 0.7524\n",
"\n",
"Epoch 00001: val_loss improved from inf to 0.74523, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 2/300\n",
"938/938 [==============================] - 0s 76us/step - loss: 0.7523 - acc: 0.7313 - val_loss: 0.7328 - val_acc: 0.7429\n",
"\n",
"Epoch 00002: val_loss improved from 0.74523 to 0.73280, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 3/300\n",
"938/938 [==============================] - 0s 74us/step - loss: 0.7292 - acc: 0.7495 - val_loss: 0.7240 - val_acc: 0.7333\n",
"\n",
"Epoch 00003: val_loss improved from 0.73280 to 0.72398, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 4/300\n",
"938/938 [==============================] - 0s 82us/step - loss: 0.7211 - acc: 0.7441 - val_loss: 0.7141 - val_acc: 0.7333\n",
"\n",
"Epoch 00004: val_loss improved from 0.72398 to 0.71408, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 5/300\n",
"938/938 [==============================] - 0s 84us/step - loss: 0.6862 - acc: 0.7601 - val_loss: 0.7117 - val_acc: 0.7333\n",
"\n",
"Epoch 00005: val_loss improved from 0.71408 to 0.71174, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 6/300\n",
"938/938 [==============================] - 0s 74us/step - loss: 0.6646 - acc: 0.7537 - val_loss: 0.7110 - val_acc: 0.7333\n",
"\n",
"Epoch 00006: val_loss improved from 0.71174 to 0.71097, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 7/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 0.6576 - acc: 0.7655 - val_loss: 0.7034 - val_acc: 0.7429\n",
"\n",
"Epoch 00007: val_loss improved from 0.71097 to 0.70335, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 8/300\n",
"938/938 [==============================] - 0s 69us/step - loss: 0.6594 - acc: 0.7655 - val_loss: 0.7016 - val_acc: 0.7429\n",
"\n",
"Epoch 00008: val_loss improved from 0.70335 to 0.70159, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 9/300\n",
"938/938 [==============================] - 0s 73us/step - loss: 0.6650 - acc: 0.7644 - val_loss: 0.7008 - val_acc: 0.7429\n",
"\n",
"Epoch 00009: val_loss improved from 0.70159 to 0.70081, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 10/300\n",
"938/938 [==============================] - 0s 73us/step - loss: 0.6344 - acc: 0.7665 - val_loss: 0.7043 - val_acc: 0.7429\n",
"\n",
"Epoch 00010: val_loss did not improve from 0.70081\n",
"Epoch 11/300\n",
"938/938 [==============================] - 0s 72us/step - loss: 0.6337 - acc: 0.7665 - val_loss: 0.6979 - val_acc: 0.7429\n",
"\n",
"Epoch 00011: val_loss improved from 0.70081 to 0.69788, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 12/300\n",
"938/938 [==============================] - 0s 74us/step - loss: 0.6329 - acc: 0.7601 - val_loss: 0.6970 - val_acc: 0.7429\n",
"\n",
"Epoch 00012: val_loss improved from 0.69788 to 0.69701, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 13/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 0.6176 - acc: 0.7708 - val_loss: 0.6976 - val_acc: 0.7429\n",
"\n",
"Epoch 00013: val_loss did not improve from 0.69701\n",
"Epoch 14/300\n",
"938/938 [==============================] - 0s 79us/step - loss: 0.6086 - acc: 0.7655 - val_loss: 0.6951 - val_acc: 0.7429\n",
"\n",
"Epoch 00014: val_loss improved from 0.69701 to 0.69508, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 15/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 0.6289 - acc: 0.7719 - val_loss: 0.6965 - val_acc: 0.7429\n",
"\n",
"Epoch 00015: val_loss did not improve from 0.69508\n",
"Epoch 16/300\n",
"938/938 [==============================] - 0s 73us/step - loss: 0.6104 - acc: 0.7687 - val_loss: 0.6972 - val_acc: 0.7429\n",
"\n",
"Epoch 00016: val_loss did not improve from 0.69508\n",
"Epoch 17/300\n",
"938/938 [==============================] - 0s 72us/step - loss: 0.6014 - acc: 0.7772 - val_loss: 0.6946 - val_acc: 0.7333\n",
"\n",
"Epoch 00017: val_loss improved from 0.69508 to 0.69457, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 18/300\n",
"938/938 [==============================] - 0s 73us/step - loss: 0.6165 - acc: 0.7665 - val_loss: 0.6978 - val_acc: 0.7429\n",
"\n",
"Epoch 00018: val_loss did not improve from 0.69457\n",
"Epoch 19/300\n",
"938/938 [==============================] - 0s 74us/step - loss: 0.6167 - acc: 0.7644 - val_loss: 0.6933 - val_acc: 0.7333\n",
"\n",
"Epoch 00019: val_loss improved from 0.69457 to 0.69334, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 20/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 0.6039 - acc: 0.7708 - val_loss: 0.6966 - val_acc: 0.7429\n",
"\n",
"Epoch 00020: val_loss did not improve from 0.69334\n",
"Epoch 21/300\n",
"938/938 [==============================] - 0s 72us/step - loss: 0.6079 - acc: 0.7740 - val_loss: 0.6931 - val_acc: 0.7429\n",
"\n",
"Epoch 00021: val_loss improved from 0.69334 to 0.69311, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 22/300\n",
"938/938 [==============================] - 0s 73us/step - loss: 0.6071 - acc: 0.7697 - val_loss: 0.6897 - val_acc: 0.7333\n",
"\n",
"Epoch 00022: val_loss improved from 0.69311 to 0.68972, saving model to checkpoint_Embarked.hdf5\n",
"Epoch 23/300\n",
"938/938 [==============================] - 0s 69us/step - loss: 0.6012 - acc: 0.7687 - val_loss: 0.6914 - val_acc: 0.7333\n",
"\n",
"Epoch 00023: val_loss did not improve from 0.68972\n",
"Epoch 24/300\n",
"938/938 [==============================] - 0s 77us/step - loss: 0.5974 - acc: 0.7804 - val_loss: 0.6913 - val_acc: 0.7333\n",
"\n",
"Epoch 00024: val_loss did not improve from 0.68972\n",
"Epoch 25/300\n",
"938/938 [==============================] - 0s 77us/step - loss: 0.5967 - acc: 0.7761 - val_loss: 0.6933 - val_acc: 0.7333\n",
"\n",
"Epoch 00025: ReduceLROnPlateau reducing learning rate to 0.00020000000949949026.\n",
"\n",
"Epoch 00025: val_loss did not improve from 0.68972\n",
"Epoch 26/300\n",
"938/938 [==============================] - 0s 86us/step - loss: 0.5963 - acc: 0.7751 - val_loss: 0.6924 - val_acc: 0.7333\n",
"\n",
"Epoch 00026: val_loss did not improve from 0.68972\n",
"Epoch 27/300\n",
"938/938 [==============================] - 0s 94us/step - loss: 0.5949 - acc: 0.7729 - val_loss: 0.6920 - val_acc: 0.7333\n",
"\n",
"Epoch 00027: val_loss did not improve from 0.68972\n",
"Epoch 28/300\n",
"938/938 [==============================] - 0s 79us/step - loss: 0.5952 - acc: 0.7783 - val_loss: 0.6918 - val_acc: 0.7333\n",
"\n",
"Epoch 00028: ReduceLROnPlateau reducing learning rate to 4.0000001899898055e-05.\n",
"\n",
"Epoch 00028: val_loss did not improve from 0.68972\n",
"Epoch 29/300\n",
"938/938 [==============================] - 0s 87us/step - loss: 0.6045 - acc: 0.7665 - val_loss: 0.6918 - val_acc: 0.7333\n",
"\n",
"Epoch 00029: val_loss did not improve from 0.68972\n",
"Epoch 30/300\n",
"938/938 [==============================] - 0s 83us/step - loss: 0.5944 - acc: 0.7719 - val_loss: 0.6917 - val_acc: 0.7333\n",
"\n",
"Epoch 00030: val_loss did not improve from 0.68972\n",
"Epoch 31/300\n",
"938/938 [==============================] - 0s 65us/step - loss: 0.6018 - acc: 0.7740 - val_loss: 0.6916 - val_acc: 0.7333\n",
"\n",
"Epoch 00031: ReduceLROnPlateau reducing learning rate to 8.000000525498762e-06.\n",
"\n",
"Epoch 00031: val_loss did not improve from 0.68972\n",
"Epoch 32/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 0.5872 - acc: 0.7697 - val_loss: 0.6916 - val_acc: 0.7333\n",
"\n",
"Epoch 00032: val_loss did not improve from 0.68972\n",
"Epoch 00032: early stopping\n"
]
},
{
"data": {
"image/png": "\n",
"text/plain": [
"<matplotlib.figure.Figure at 0x7fcb4879bf28>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"fill_data('Embarked') # id:62,830"
]
},
{
"cell_type": "code",
"execution_count": 18,
"metadata": {
"scrolled": true
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Train on 938 samples, validate on 105 samples\n",
"Epoch 1/300\n",
"938/938 [==============================] - 0s 253us/step - loss: 8.9094 - mean_absolute_error: 2.5688 - val_loss: 5.5439 - val_mean_absolute_error: 1.9672\n",
"\n",
"Epoch 00001: val_loss improved from inf to 5.54393, saving model to checkpoint_Fare.hdf5\n",
"Epoch 2/300\n",
"938/938 [==============================] - 0s 73us/step - loss: 4.6612 - mean_absolute_error: 1.8467 - val_loss: 3.4742 - val_mean_absolute_error: 1.4843\n",
"\n",
"Epoch 00002: val_loss improved from 5.54393 to 3.47424, saving model to checkpoint_Fare.hdf5\n",
"Epoch 3/300\n",
"938/938 [==============================] - 0s 72us/step - loss: 2.7566 - mean_absolute_error: 1.3448 - val_loss: 2.4206 - val_mean_absolute_error: 1.1232\n",
"\n",
"Epoch 00003: val_loss improved from 3.47424 to 2.42062, saving model to checkpoint_Fare.hdf5\n",
"Epoch 4/300\n",
"938/938 [==============================] - 0s 80us/step - loss: 1.7961 - mean_absolute_error: 0.9854 - val_loss: 1.8958 - val_mean_absolute_error: 0.8475\n",
"\n",
"Epoch 00004: val_loss improved from 2.42062 to 1.89583, saving model to checkpoint_Fare.hdf5\n",
"Epoch 5/300\n",
"938/938 [==============================] - 0s 91us/step - loss: 1.3640 - mean_absolute_error: 0.7712 - val_loss: 1.7291 - val_mean_absolute_error: 0.7299\n",
"\n",
"Epoch 00005: val_loss improved from 1.89583 to 1.72906, saving model to checkpoint_Fare.hdf5\n",
"Epoch 6/300\n",
"938/938 [==============================] - 0s 96us/step - loss: 1.2310 - mean_absolute_error: 0.6862 - val_loss: 1.6974 - val_mean_absolute_error: 0.7071\n",
"\n",
"Epoch 00006: val_loss improved from 1.72906 to 1.69739, saving model to checkpoint_Fare.hdf5\n",
"Epoch 7/300\n",
"938/938 [==============================] - 0s 90us/step - loss: 1.1849 - mean_absolute_error: 0.6521 - val_loss: 1.6919 - val_mean_absolute_error: 0.7020\n",
"\n",
"Epoch 00007: val_loss improved from 1.69739 to 1.69192, saving model to checkpoint_Fare.hdf5\n",
"Epoch 8/300\n",
"938/938 [==============================] - 0s 90us/step - loss: 1.1712 - mean_absolute_error: 0.6380 - val_loss: 1.6902 - val_mean_absolute_error: 0.6990\n",
"\n",
"Epoch 00008: val_loss improved from 1.69192 to 1.69016, saving model to checkpoint_Fare.hdf5\n",
"Epoch 9/300\n",
"938/938 [==============================] - 0s 72us/step - loss: 1.1354 - mean_absolute_error: 0.6196 - val_loss: 1.6893 - val_mean_absolute_error: 0.6972\n",
"\n",
"Epoch 00009: val_loss improved from 1.69016 to 1.68933, saving model to checkpoint_Fare.hdf5\n",
"Epoch 10/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 1.1181 - mean_absolute_error: 0.6091 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00010: val_loss improved from 1.68933 to 1.68909, saving model to checkpoint_Fare.hdf5\n",
"Epoch 11/300\n",
"938/938 [==============================] - 0s 70us/step - loss: 1.1126 - mean_absolute_error: 0.6037 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00011: val_loss did not improve from 1.68909\n",
"Epoch 12/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 1.1241 - mean_absolute_error: 0.6080 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00012: val_loss did not improve from 1.68909\n",
"Epoch 13/300\n",
"938/938 [==============================] - 0s 76us/step - loss: 1.1258 - mean_absolute_error: 0.6088 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00013: ReduceLROnPlateau reducing learning rate to 0.00020000000949949026.\n",
"\n",
"Epoch 00013: val_loss did not improve from 1.68909\n",
"Epoch 14/300\n",
"938/938 [==============================] - 0s 65us/step - loss: 1.1162 - mean_absolute_error: 0.6043 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00014: val_loss did not improve from 1.68909\n",
"Epoch 15/300\n",
"938/938 [==============================] - 0s 74us/step - loss: 1.1207 - mean_absolute_error: 0.6061 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00015: val_loss did not improve from 1.68909\n",
"Epoch 16/300\n",
"938/938 [==============================] - 0s 76us/step - loss: 1.1153 - mean_absolute_error: 0.6049 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00016: ReduceLROnPlateau reducing learning rate to 4.0000001899898055e-05.\n",
"\n",
"Epoch 00016: val_loss did not improve from 1.68909\n",
"Epoch 17/300\n",
"938/938 [==============================] - 0s 81us/step - loss: 1.1196 - mean_absolute_error: 0.6068 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00017: val_loss did not improve from 1.68909\n",
"Epoch 18/300\n",
"938/938 [==============================] - 0s 88us/step - loss: 1.1197 - mean_absolute_error: 0.6043 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00018: val_loss did not improve from 1.68909\n",
"Epoch 19/300\n",
"938/938 [==============================] - 0s 84us/step - loss: 1.1266 - mean_absolute_error: 0.6088 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00019: ReduceLROnPlateau reducing learning rate to 8.000000525498762e-06.\n",
"\n",
"Epoch 00019: val_loss did not improve from 1.68909\n",
"Epoch 20/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 1.1196 - mean_absolute_error: 0.6043 - val_loss: 1.6891 - val_mean_absolute_error: 0.6967\n",
"\n",
"Epoch 00020: val_loss did not improve from 1.68909\n",
"Epoch 00020: early stopping\n"
]
}
],
"source": [
"fill_data('Fare') # id:1044 -- presumably the PassengerId of the row with a missing Fare (TODO confirm)"
]
},
{
"cell_type": "code",
"execution_count": 19,
"metadata": {
"scrolled": true
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Train on 938 samples, validate on 105 samples\n",
"Epoch 1/300\n",
"938/938 [==============================] - 0s 341us/step - loss: 7.6284 - mean_absolute_error: 2.3602 - val_loss: 4.4499 - val_mean_absolute_error: 1.8288\n",
"\n",
"Epoch 00001: val_loss improved from inf to 4.44989, saving model to checkpoint_Age.hdf5\n",
"Epoch 2/300\n",
"938/938 [==============================] - 0s 82us/step - loss: 3.8868 - mean_absolute_error: 1.6588 - val_loss: 2.4728 - val_mean_absolute_error: 1.3419\n",
"\n",
"Epoch 00002: val_loss improved from 4.44989 to 2.47278, saving model to checkpoint_Age.hdf5\n",
"Epoch 3/300\n",
"938/938 [==============================] - 0s 81us/step - loss: 2.2828 - mean_absolute_error: 1.2684 - val_loss: 1.5693 - val_mean_absolute_error: 1.0532\n",
"\n",
"Epoch 00003: val_loss improved from 2.47278 to 1.56933, saving model to checkpoint_Age.hdf5\n",
"Epoch 4/300\n",
"938/938 [==============================] - 0s 77us/step - loss: 1.5540 - mean_absolute_error: 1.0170 - val_loss: 1.1551 - val_mean_absolute_error: 0.8729\n",
"\n",
"Epoch 00004: val_loss improved from 1.56933 to 1.15514, saving model to checkpoint_Age.hdf5\n",
"Epoch 5/300\n",
"938/938 [==============================] - 0s 80us/step - loss: 1.1987 - mean_absolute_error: 0.8832 - val_loss: 1.0211 - val_mean_absolute_error: 0.8047\n",
"\n",
"Epoch 00005: val_loss improved from 1.15514 to 1.02112, saving model to checkpoint_Age.hdf5\n",
"Epoch 6/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 1.0803 - mean_absolute_error: 0.8229 - val_loss: 0.9843 - val_mean_absolute_error: 0.7832\n",
"\n",
"Epoch 00006: val_loss improved from 1.02112 to 0.98428, saving model to checkpoint_Age.hdf5\n",
"Epoch 7/300\n",
"938/938 [==============================] - 0s 79us/step - loss: 1.0654 - mean_absolute_error: 0.8107 - val_loss: 0.9686 - val_mean_absolute_error: 0.7786\n",
"\n",
"Epoch 00007: val_loss improved from 0.98428 to 0.96857, saving model to checkpoint_Age.hdf5\n",
"Epoch 8/300\n",
"938/938 [==============================] - 0s 82us/step - loss: 1.0416 - mean_absolute_error: 0.8012 - val_loss: 0.9594 - val_mean_absolute_error: 0.7756\n",
"\n",
"Epoch 00008: val_loss improved from 0.96857 to 0.95938, saving model to checkpoint_Age.hdf5\n",
"Epoch 9/300\n",
"938/938 [==============================] - 0s 74us/step - loss: 1.0249 - mean_absolute_error: 0.7952 - val_loss: 0.9534 - val_mean_absolute_error: 0.7736\n",
"\n",
"Epoch 00009: val_loss improved from 0.95938 to 0.95341, saving model to checkpoint_Age.hdf5\n",
"Epoch 10/300\n",
"938/938 [==============================] - 0s 76us/step - loss: 1.0173 - mean_absolute_error: 0.7899 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00010: val_loss improved from 0.95341 to 0.95071, saving model to checkpoint_Age.hdf5\n",
"Epoch 11/300\n",
"938/938 [==============================] - 0s 80us/step - loss: 1.0108 - mean_absolute_error: 0.7877 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00011: val_loss did not improve from 0.95071\n",
"Epoch 12/300\n",
"938/938 [==============================] - 0s 80us/step - loss: 1.0022 - mean_absolute_error: 0.7844 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00012: val_loss did not improve from 0.95071\n",
"Epoch 13/300\n",
"938/938 [==============================] - 0s 75us/step - loss: 1.0092 - mean_absolute_error: 0.7845 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00013: ReduceLROnPlateau reducing learning rate to 0.00020000000949949026.\n",
"\n",
"Epoch 00013: val_loss did not improve from 0.95071\n",
"Epoch 14/300\n",
"938/938 [==============================] - 0s 73us/step - loss: 0.9999 - mean_absolute_error: 0.7827 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00014: val_loss did not improve from 0.95071\n",
"Epoch 15/300\n",
"938/938 [==============================] - 0s 68us/step - loss: 1.0042 - mean_absolute_error: 0.7825 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00015: val_loss did not improve from 0.95071\n",
"Epoch 16/300\n",
"938/938 [==============================] - 0s 70us/step - loss: 1.0074 - mean_absolute_error: 0.7871 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00016: ReduceLROnPlateau reducing learning rate to 4.0000001899898055e-05.\n",
"\n",
"Epoch 00016: val_loss did not improve from 0.95071\n",
"Epoch 17/300\n",
"938/938 [==============================] - 0s 76us/step - loss: 1.0043 - mean_absolute_error: 0.7832 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00017: val_loss did not improve from 0.95071\n",
"Epoch 18/300\n",
"938/938 [==============================] - 0s 73us/step - loss: 1.0017 - mean_absolute_error: 0.7830 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00018: val_loss did not improve from 0.95071\n",
"Epoch 19/300\n",
"938/938 [==============================] - 0s 72us/step - loss: 1.0063 - mean_absolute_error: 0.7838 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00019: ReduceLROnPlateau reducing learning rate to 8.000000525498762e-06.\n",
"\n",
"Epoch 00019: val_loss did not improve from 0.95071\n",
"Epoch 20/300\n",
"938/938 [==============================] - 0s 74us/step - loss: 1.0131 - mean_absolute_error: 0.7872 - val_loss: 0.9507 - val_mean_absolute_error: 0.7725\n",
"\n",
"Epoch 00020: val_loss did not improve from 0.95071\n",
"Epoch 00020: early stopping\n"
]
}
],
"source": [
"fill_data('Age') # id: 6,18,20,27,29,30 -- presumably PassengerIds of some rows with a missing Age (TODO confirm)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Split the data back into train and test sets"
]
},
{
"cell_type": "code",
"execution_count": 20,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Pclass</th>\n",
" <th>Sex</th>\n",
" <th>Age</th>\n",
" <th>SibSp</th>\n",
" <th>Parch</th>\n",
" <th>Fare</th>\n",
" <th>Cabin</th>\n",
" <th>Embarked</th>\n",
" <th>Title</th>\n",
" </tr>\n",
" <tr>\n",
" <th>PassengerId</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>-0.546789</td>\n",
" <td>0.481104</td>\n",
" <td>-0.444829</td>\n",
" <td>-0.503210</td>\n",
" <td>0</td>\n",
" <td>0.0</td>\n",
" <td>-0.541826</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>0.563282</td>\n",
" <td>0.481104</td>\n",
" <td>-0.444829</td>\n",
" <td>0.733941</td>\n",
" <td>1</td>\n",
" <td>1.0</td>\n",
" <td>0.053183</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>3</td>\n",
" <td>1</td>\n",
" <td>-0.269271</td>\n",
" <td>-0.478904</td>\n",
" <td>-0.444829</td>\n",
" <td>-0.490169</td>\n",
" <td>0</td>\n",
" <td>0.0</td>\n",
" <td>0.648192</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>0.355144</td>\n",
" <td>0.481104</td>\n",
" <td>-0.444829</td>\n",
" <td>0.382632</td>\n",
" <td>1</td>\n",
" <td>0.0</td>\n",
" <td>0.053183</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>0.355144</td>\n",
" <td>-0.478904</td>\n",
" <td>-0.444829</td>\n",
" <td>-0.487754</td>\n",
" <td>0</td>\n",
" <td>0.0</td>\n",
" <td>-0.541826</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Pclass Sex Age SibSp Parch Fare Cabin \\\n",
"PassengerId \n",
"1 3 0 -0.546789 0.481104 -0.444829 -0.503210 0 \n",
"2 1 1 0.563282 0.481104 -0.444829 0.733941 1 \n",
"3 3 1 -0.269271 -0.478904 -0.444829 -0.490169 0 \n",
"4 1 1 0.355144 0.481104 -0.444829 0.382632 1 \n",
"5 3 0 0.355144 -0.478904 -0.444829 -0.487754 0 \n",
"\n",
" Embarked Title \n",
"PassengerId \n",
"1 0.0 -0.541826 \n",
"2 1.0 0.053183 \n",
"3 0.0 0.648192 \n",
"4 0.0 0.053183 \n",
"5 0.0 -0.541826 "
]
},
"execution_count": 20,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Split df0 by position: the first len(train) rows become the training features,\n",
"# the remaining rows the test features. Deriving the boundary from `train` avoids a\n",
"# hard-coded row count and keeps train0 aligned with train.Survived.\n",
"# NOTE(review): assumes df0 holds the train rows first, then the test rows -- confirm where df0 is built.\n",
"n_train = len(train)\n",
"\n",
"train0 = df0.iloc[:n_train].copy()\n",
"test0 = df0.iloc[n_train:].copy()\n",
"\n",
"train0.head()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Model to estimate Survived on Test data for submission"
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {
"scrolled": true
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Train on 712 samples, validate on 179 samples\n",
"Epoch 1/300\n",
"712/712 [==============================] - 1s 915us/step - loss: 0.6920 - acc: 0.6236 - val_loss: 0.4706 - val_acc: 0.7989\n",
"\n",
"Epoch 00001: val_loss improved from inf to 0.47056, saving model to checkpoint_final.hdf5\n",
"Epoch 2/300\n",
"712/712 [==============================] - 0s 466us/step - loss: 0.5920 - acc: 0.7233 - val_loss: 0.4519 - val_acc: 0.8045\n",
"\n",
"Epoch 00002: val_loss improved from 0.47056 to 0.45195, saving model to checkpoint_final.hdf5\n",
"Epoch 3/300\n",
"712/712 [==============================] - 0s 579us/step - loss: 0.5272 - acc: 0.7598 - val_loss: 0.4405 - val_acc: 0.7933\n",
"\n",
"Epoch 00003: val_loss improved from 0.45195 to 0.44048, saving model to checkpoint_final.hdf5\n",
"Epoch 4/300\n",
"712/712 [==============================] - 0s 495us/step - loss: 0.5220 - acc: 0.7612 - val_loss: 0.4308 - val_acc: 0.7877\n",
"\n",
"Epoch 00004: val_loss improved from 0.44048 to 0.43079, saving model to checkpoint_final.hdf5\n",
"Epoch 5/300\n",
"712/712 [==============================] - 0s 446us/step - loss: 0.5136 - acc: 0.7640 - val_loss: 0.4141 - val_acc: 0.8101\n",
"\n",
"Epoch 00005: val_loss improved from 0.43079 to 0.41408, saving model to checkpoint_final.hdf5\n",
"Epoch 6/300\n",
"712/712 [==============================] - 0s 564us/step - loss: 0.5008 - acc: 0.7921 - val_loss: 0.4178 - val_acc: 0.8156\n",
"\n",
"Epoch 00006: val_loss did not improve from 0.41408\n",
"Epoch 7/300\n",
"712/712 [==============================] - 0s 457us/step - loss: 0.4654 - acc: 0.7935 - val_loss: 0.4178 - val_acc: 0.8045\n",
"\n",
"Epoch 00007: val_loss did not improve from 0.41408\n",
"Epoch 8/300\n",
"712/712 [==============================] - 0s 456us/step - loss: 0.4761 - acc: 0.7907 - val_loss: 0.4091 - val_acc: 0.8156\n",
"\n",
"Epoch 00008: val_loss improved from 0.41408 to 0.40911, saving model to checkpoint_final.hdf5\n",
"Epoch 9/300\n",
"712/712 [==============================] - 0s 510us/step - loss: 0.4743 - acc: 0.8048 - val_loss: 0.4105 - val_acc: 0.8101\n",
"\n",
"Epoch 00009: val_loss did not improve from 0.40911\n",
"Epoch 10/300\n",
"712/712 [==============================] - 0s 450us/step - loss: 0.4678 - acc: 0.7949 - val_loss: 0.3936 - val_acc: 0.8101\n",
"\n",
"Epoch 00010: val_loss improved from 0.40911 to 0.39362, saving model to checkpoint_final.hdf5\n",
"Epoch 11/300\n",
"712/712 [==============================] - 0s 470us/step - loss: 0.4531 - acc: 0.8132 - val_loss: 0.4029 - val_acc: 0.8212\n",
"\n",
"Epoch 00011: val_loss did not improve from 0.39362\n",
"Epoch 12/300\n",
"712/712 [==============================] - 0s 483us/step - loss: 0.4576 - acc: 0.8076 - val_loss: 0.3877 - val_acc: 0.8156\n",
"\n",
"Epoch 00012: val_loss improved from 0.39362 to 0.38769, saving model to checkpoint_final.hdf5\n",
"Epoch 13/300\n",
"712/712 [==============================] - 0s 468us/step - loss: 0.4707 - acc: 0.8034 - val_loss: 0.3819 - val_acc: 0.8212\n",
"\n",
"Epoch 00013: val_loss improved from 0.38769 to 0.38185, saving model to checkpoint_final.hdf5\n",
"Epoch 14/300\n",
"712/712 [==============================] - 0s 464us/step - loss: 0.4626 - acc: 0.8034 - val_loss: 0.3824 - val_acc: 0.8212\n",
"\n",
"Epoch 00014: val_loss did not improve from 0.38185\n",
"Epoch 15/300\n",
"712/712 [==============================] - 0s 465us/step - loss: 0.4725 - acc: 0.7935 - val_loss: 0.3826 - val_acc: 0.8212\n",
"\n",
"Epoch 00015: val_loss did not improve from 0.38185\n",
"Epoch 16/300\n",
"712/712 [==============================] - 0s 458us/step - loss: 0.4554 - acc: 0.8104 - val_loss: 0.3769 - val_acc: 0.8268\n",
"\n",
"Epoch 00016: val_loss improved from 0.38185 to 0.37686, saving model to checkpoint_final.hdf5\n",
"Epoch 17/300\n",
"712/712 [==============================] - 0s 461us/step - loss: 0.4565 - acc: 0.8104 - val_loss: 0.3707 - val_acc: 0.8380\n",
"\n",
"Epoch 00017: val_loss improved from 0.37686 to 0.37075, saving model to checkpoint_final.hdf5\n",
"Epoch 18/300\n",
"712/712 [==============================] - 0s 462us/step - loss: 0.4378 - acc: 0.8132 - val_loss: 0.3780 - val_acc: 0.8324\n",
"\n",
"Epoch 00018: val_loss did not improve from 0.37075\n",
"Epoch 19/300\n",
"712/712 [==============================] - 0s 457us/step - loss: 0.4452 - acc: 0.8076 - val_loss: 0.3650 - val_acc: 0.8380\n",
"\n",
"Epoch 00019: val_loss improved from 0.37075 to 0.36499, saving model to checkpoint_final.hdf5\n",
"Epoch 20/300\n",
"712/712 [==============================] - 0s 462us/step - loss: 0.4525 - acc: 0.8076 - val_loss: 0.3754 - val_acc: 0.8436\n",
"\n",
"Epoch 00020: val_loss did not improve from 0.36499\n",
"Epoch 21/300\n",
"712/712 [==============================] - 0s 461us/step - loss: 0.4346 - acc: 0.8174 - val_loss: 0.3658 - val_acc: 0.8380\n",
"\n",
"Epoch 00021: val_loss did not improve from 0.36499\n",
"Epoch 22/300\n",
"712/712 [==============================] - 0s 456us/step - loss: 0.4429 - acc: 0.7963 - val_loss: 0.3620 - val_acc: 0.8324\n",
"\n",
"Epoch 00022: val_loss improved from 0.36499 to 0.36197, saving model to checkpoint_final.hdf5\n",
"Epoch 23/300\n",
"712/712 [==============================] - 0s 451us/step - loss: 0.4420 - acc: 0.8048 - val_loss: 0.3654 - val_acc: 0.8380\n",
"\n",
"Epoch 00023: val_loss did not improve from 0.36197\n",
"Epoch 24/300\n",
"712/712 [==============================] - 0s 459us/step - loss: 0.4237 - acc: 0.8188 - val_loss: 0.3661 - val_acc: 0.8324\n",
"\n",
"Epoch 00024: val_loss did not improve from 0.36197\n",
"Epoch 25/300\n",
"712/712 [==============================] - 0s 461us/step - loss: 0.4378 - acc: 0.8174 - val_loss: 0.3621 - val_acc: 0.8380\n",
"\n",
"Epoch 00025: ReduceLROnPlateau reducing learning rate to 0.00020000000949949026.\n",
"\n",
"Epoch 00025: val_loss did not improve from 0.36197\n",
"Epoch 26/300\n",
"712/712 [==============================] - 0s 447us/step - loss: 0.4346 - acc: 0.8132 - val_loss: 0.3625 - val_acc: 0.8380\n",
"\n",
"Epoch 00026: val_loss did not improve from 0.36197\n",
"Epoch 27/300\n",
"712/712 [==============================] - 0s 474us/step - loss: 0.4328 - acc: 0.8188 - val_loss: 0.3624 - val_acc: 0.8380\n",
"\n",
"Epoch 00027: val_loss did not improve from 0.36197\n",
"Epoch 28/300\n",
"712/712 [==============================] - 0s 460us/step - loss: 0.4285 - acc: 0.8174 - val_loss: 0.3616 - val_acc: 0.8380\n",
"\n",
"Epoch 00028: val_loss improved from 0.36197 to 0.36160, saving model to checkpoint_final.hdf5\n",
"Epoch 29/300\n",
"712/712 [==============================] - 0s 462us/step - loss: 0.4219 - acc: 0.8202 - val_loss: 0.3602 - val_acc: 0.8380\n",
"\n",
"Epoch 00029: val_loss improved from 0.36160 to 0.36017, saving model to checkpoint_final.hdf5\n",
"Epoch 30/300\n",
"712/712 [==============================] - 0s 462us/step - loss: 0.4244 - acc: 0.8188 - val_loss: 0.3642 - val_acc: 0.8324\n",
"\n",
"Epoch 00030: val_loss did not improve from 0.36017\n",
"Epoch 31/300\n",
"712/712 [==============================] - 0s 459us/step - loss: 0.4344 - acc: 0.8034 - val_loss: 0.3621 - val_acc: 0.8380\n",
"\n",
"Epoch 00031: val_loss did not improve from 0.36017\n",
"Epoch 32/300\n",
"712/712 [==============================] - 0s 469us/step - loss: 0.4240 - acc: 0.8174 - val_loss: 0.3607 - val_acc: 0.8380\n",
"\n",
"Epoch 00032: ReduceLROnPlateau reducing learning rate to 4.0000001899898055e-05.\n",
"\n",
"Epoch 00032: val_loss did not improve from 0.36017\n",
"Epoch 33/300\n",
"712/712 [==============================] - 0s 459us/step - loss: 0.4373 - acc: 0.8104 - val_loss: 0.3609 - val_acc: 0.8380\n",
"\n",
"Epoch 00033: val_loss did not improve from 0.36017\n",
"Epoch 34/300\n",
"712/712 [==============================] - 0s 485us/step - loss: 0.4190 - acc: 0.8188 - val_loss: 0.3609 - val_acc: 0.8380\n",
"\n",
"Epoch 00034: val_loss did not improve from 0.36017\n",
"Epoch 35/300\n",
"712/712 [==============================] - 0s 456us/step - loss: 0.4233 - acc: 0.8230 - val_loss: 0.3610 - val_acc: 0.8380\n",
"\n",
"Epoch 00035: ReduceLROnPlateau reducing learning rate to 8.000000525498762e-06.\n",
"\n",
"Epoch 00035: val_loss did not improve from 0.36017\n",
"Epoch 36/300\n",
"712/712 [==============================] - 0s 462us/step - loss: 0.4290 - acc: 0.8244 - val_loss: 0.3610 - val_acc: 0.8380\n",
"\n",
"Epoch 00036: val_loss did not improve from 0.36017\n",
"Epoch 37/300\n",
"712/712 [==============================] - 0s 465us/step - loss: 0.4351 - acc: 0.8146 - val_loss: 0.3610 - val_acc: 0.8380\n",
"\n",
"Epoch 00037: val_loss did not improve from 0.36017\n",
"Epoch 38/300\n",
"712/712 [==============================] - 0s 472us/step - loss: 0.4340 - acc: 0.8174 - val_loss: 0.3611 - val_acc: 0.8380\n",
"\n",
"Epoch 00038: ReduceLROnPlateau reducing learning rate to 1.6000001778593287e-06.\n",
"\n",
"Epoch 00038: val_loss did not improve from 0.36017\n",
"Epoch 39/300\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"712/712 [==============================] - 0s 448us/step - loss: 0.4410 - acc: 0.8076 - val_loss: 0.3611 - val_acc: 0.8380\n",
"\n",
"Epoch 00039: val_loss did not improve from 0.36017\n",
"Epoch 00039: early stopping\n"
]
}
],
"source": [
"# Survived classifier: one 64-unit ReLU layer with dropout, then a 2-way softmax.\n",
"df0_cols = len(df0.columns)\n",
"\n",
"model = Sequential([\n",
"    Dense(64, activation='relu', input_shape=(df0_cols,), kernel_initializer=initializer),\n",
"    Dropout(0.5, seed=random_n),\n",
"    Dense(2, activation='softmax', kernel_initializer=initializer),\n",
"])\n",
"model.compile(loss='sparse_categorical_crossentropy', optimizer='adam', metrics=['acc'])\n",
"\n",
"# Callbacks: shrink the learning rate when val_loss plateaus, keep only the best\n",
"# checkpoint on disk, and stop after 10 epochs without improvement.\n",
"reduce_lr = ReduceLROnPlateau(monitor='val_loss', factor=0.2, patience=3, min_lr=1e-6, verbose=1)\n",
"checkpointer = ModelCheckpoint(filepath='checkpoint_final.hdf5', save_best_only=True, verbose=1)\n",
"early_stopping = EarlyStopping(patience=10, verbose=1)\n",
"\n",
"epochs = 300\n",
"hist = model.fit(\n",
"    train0,\n",
"    train.Survived,\n",
"    batch_size=5,\n",
"    epochs=epochs,\n",
"    validation_split=0.2,\n",
"    callbacks=[reduce_lr, early_stopping, checkpointer],\n",
"    verbose=1,\n",
")\n",
"\n",
"# Reload the best checkpoint before predicting on the test features.\n",
"model.load_weights('checkpoint_final.hdf5')\n",
"pred = model.predict(test0)"
]
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {
"scrolled": false
},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<matplotlib.figure.Figure at 0x7fc9b43e4828>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Training accuracy (blue) and training loss (red) per epoch.\n",
"for metric_name, line_style in (('acc', 'b-'), ('loss', 'r-')):\n",
"    plt.plot(hist.history[metric_name], line_style, label=metric_name)\n",
"plt.xlabel('epochs')\n",
"plt.legend()\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {
"scrolled": true
},
"outputs": [],
"source": [
"result = pred.argmax(axis=1)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Submission file:"
]
},
{
"cell_type": "code",
"execution_count": 24,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Diff: 0\n",
"Survived: 160\n"
]
}
],
"source": [
"# Compare to the previous submission when one exists. On a fresh run there is no\n",
"# submission.csv yet, so the comparison is skipped instead of raising FileNotFoundError.\n",
"if os.path.exists('submission.csv'):\n",
"    prev = pd.read_csv('submission.csv', index_col=0)\n",
"    print('Diff: ', np.sum(prev.Survived.values != result))\n",
"print('Survived: ', result.sum())\n",
"\n",
"# Write the submission file: one row per test PassengerId with its predicted Survived label.\n",
"submission = pd.DataFrame({'PassengerId': test.index, 'Survived': result})\n",
"submission.to_csv('submission.csv', index=False)"
]
},
{
"cell_type": "code",
"execution_count": 25,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 1,\n",
" 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1,\n",
" 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1,\n",
" 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1,\n",
" 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0,\n",
" 0, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1,\n",
" 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1,\n",
" 0, 0, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1,\n",
" 1, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1,\n",
" 0, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0,\n",
" 1, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1,\n",
" 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1,\n",
" 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0,\n",
" 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1,\n",
" 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0,\n",
" 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0,\n",
" 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0,\n",
" 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1,\n",
" 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0])"
]
},
"execution_count": 25,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"result"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "py36",
"language": "python",
"name": "py36"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.6.4"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment