Skip to content

Instantly share code, notes, and snippets.

@kuranono
Created March 27, 2022 03:11
Show Gist options
  • Save kuranono/f1ce36fb7fe3535322c5455546b9d7a5 to your computer and use it in GitHub Desktop.
Save kuranono/f1ce36fb7fe3535322c5455546b9d7a5 to your computer and use it in GitHub Desktop.
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "b99130b9",
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd\n",
"import numpy as np"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "5c1f1071",
"metadata": {},
"outputs": [],
"source": [
"# Read the three CSV files from the local ./data directory.\n",
"# Paths are relative to the notebook's working directory.\n",
"train_df = pd.read_csv(filepath_or_buffer=\"./data/train.csv\")\n",
"test_df = pd.read_csv(filepath_or_buffer=\"./data/test.csv\")\n",
"submission = pd.read_csv(filepath_or_buffer=\"./data/sample_submission.csv\")"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "6a7d0e96",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>PassengerId</th>\n",
" <th>Survived</th>\n",
" <th>Pclass</th>\n",
" <th>Name</th>\n",
" <th>Sex</th>\n",
" <th>Age</th>\n",
" <th>SibSp</th>\n",
" <th>Parch</th>\n",
" <th>Ticket</th>\n",
" <th>Fare</th>\n",
" <th>Cabin</th>\n",
" <th>Embarked</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>Oconnor, Frankie</td>\n",
" <td>male</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>209245</td>\n",
" <td>27.14</td>\n",
" <td>C12239</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>Bryan, Drew</td>\n",
" <td>male</td>\n",
" <td>NaN</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>27323</td>\n",
" <td>13.35</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>Owens, Kenneth</td>\n",
" <td>male</td>\n",
" <td>0.33</td>\n",
" <td>1</td>\n",
" <td>2</td>\n",
" <td>CA 457703</td>\n",
" <td>71.29</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>Kramer, James</td>\n",
" <td>male</td>\n",
" <td>19.00</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>A. 10866</td>\n",
" <td>13.04</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>4</td>\n",
" <td>1</td>\n",
" <td>3</td>\n",
" <td>Bond, Michael</td>\n",
" <td>male</td>\n",
" <td>25.00</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>427635</td>\n",
" <td>7.76</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" PassengerId Survived Pclass Name Sex Age SibSp Parch \\\n",
"0 0 1 1 Oconnor, Frankie male NaN 2 0 \n",
"1 1 0 3 Bryan, Drew male NaN 0 0 \n",
"2 2 0 3 Owens, Kenneth male 0.33 1 2 \n",
"3 3 0 3 Kramer, James male 19.00 0 0 \n",
"4 4 1 3 Bond, Michael male 25.00 0 0 \n",
"\n",
" Ticket Fare Cabin Embarked \n",
"0 209245 27.14 C12239 S \n",
"1 27323 13.35 NaN S \n",
"2 CA 457703 71.29 NaN S \n",
"3 A. 10866 13.04 NaN S \n",
"4 427635 7.76 NaN S "
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Show the first five rows of the training frame.\n",
"train_df.head(n=5)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "a2687a1c",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>PassengerId</th>\n",
" <th>Pclass</th>\n",
" <th>Name</th>\n",
" <th>Sex</th>\n",
" <th>Age</th>\n",
" <th>SibSp</th>\n",
" <th>Parch</th>\n",
" <th>Ticket</th>\n",
" <th>Fare</th>\n",
" <th>Cabin</th>\n",
" <th>Embarked</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>100000</td>\n",
" <td>3</td>\n",
" <td>Holliday, Daniel</td>\n",
" <td>male</td>\n",
" <td>19.0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>24745</td>\n",
" <td>63.01</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>100001</td>\n",
" <td>3</td>\n",
" <td>Nguyen, Lorraine</td>\n",
" <td>female</td>\n",
" <td>53.0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>13264</td>\n",
" <td>5.81</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>100002</td>\n",
" <td>1</td>\n",
" <td>Harris, Heather</td>\n",
" <td>female</td>\n",
" <td>19.0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>25990</td>\n",
" <td>38.91</td>\n",
" <td>B15315</td>\n",
" <td>C</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>100003</td>\n",
" <td>2</td>\n",
" <td>Larsen, Eric</td>\n",
" <td>male</td>\n",
" <td>25.0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>314011</td>\n",
" <td>12.93</td>\n",
" <td>NaN</td>\n",
" <td>S</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>100004</td>\n",
" <td>1</td>\n",
" <td>Cleary, Sarah</td>\n",
" <td>female</td>\n",
" <td>17.0</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>26203</td>\n",
" <td>26.89</td>\n",
" <td>B22515</td>\n",
" <td>C</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" PassengerId Pclass Name Sex Age SibSp Parch Ticket \\\n",
"0 100000 3 Holliday, Daniel male 19.0 0 0 24745 \n",
"1 100001 3 Nguyen, Lorraine female 53.0 0 0 13264 \n",
"2 100002 1 Harris, Heather female 19.0 0 0 25990 \n",
"3 100003 2 Larsen, Eric male 25.0 0 0 314011 \n",
"4 100004 1 Cleary, Sarah female 17.0 0 2 26203 \n",
"\n",
" Fare Cabin Embarked \n",
"0 63.01 NaN S \n",
"1 5.81 NaN S \n",
"2 38.91 B15315 C \n",
"3 12.93 NaN S \n",
"4 26.89 B22515 C "
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Show the first five rows of the test frame.\n",
"test_df.head(n=5)"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "18374243",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>PassengerId</th>\n",
" <th>Survived</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>100000</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>100001</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>100002</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>100003</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>100004</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" PassengerId Survived\n",
"0 100000 1\n",
"1 100001 1\n",
"2 100002 1\n",
"3 100003 1\n",
"4 100004 1"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Show the first five rows of the sample submission frame.\n",
"submission.head(n=5)"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.8.11"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment