Skip to content

Instantly share code, notes, and snippets.

@yingminc
Created July 27, 2017 05:55
Show Gist options
  • Save yingminc/c2832a0b35d1a8831dec907a0c90c1e3 to your computer and use it in GitHub Desktop.
Save yingminc/c2832a0b35d1a8831dec907a0c90c1e3 to your computer and use it in GitHub Desktop.
load weather data from url via pandas
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# load weather data from 気象庁"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": [
"import pandas as pd\n",
"from datetime import datetime,timedelta"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Use pandas to road data of target date from wabsite\n",
"\n",
"data: weather per 10 mintues\n",
"\n",
"observation_station: Tokyo"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": [
"date = (2017,6,1)\n",
"##url for nerima observation\n",
"#url = 'http://www.data.jma.go.jp/obd/stats/etrn/view/10min_a1.php?prec_no=44&block_no=1002&year=%s&month=%s&day=%s&view=' %(date)\n",
"#url for tokyo observation\n",
"url = 'http://www.data.jma.go.jp/obd/stats/etrn/view/10min_s1.php?prec_no=44&block_no=47662&year=%s&month=%s&day=%s&view=' %(date)\n",
"d = pd.read_html(url)[0]\n"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Organize the header of the loaded table"
]
},
{
"cell_type": "code",
"execution_count": 206,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/yingminc/anaconda3/lib/python2.7/site-packages/ipykernel_launcher.py:1: DeprecationWarning: \n",
".ix is deprecated. Please use\n",
".loc for label based indexing or\n",
".iloc for positional indexing\n",
"\n",
"See the documentation here:\n",
"http://pandas.pydata.org/pandas-docs/stable/indexing.html#deprecate_ix\n",
" \"\"\"Entry point for launching an IPython kernel.\n"
]
}
],
"source": [
"d = d.ix[2:145]\n",
"d.columns = ['時分', '現地気圧(hPa)', '海面気圧(hPa)','降水量(mm)', '気温(℃)','相対湿度(%)', '平均風速(m/s)','平均風向','最大瞬間風速(m/s)', '最大瞬間風向','日照時間(分)']"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Add data info to table"
]
},
{
"cell_type": "code",
"execution_count": 207,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style>\n",
" .dataframe thead tr:only-child th {\n",
" text-align: right;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: left;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>時分</th>\n",
" <th>現地気圧(hPa)</th>\n",
" <th>海面気圧(hPa)</th>\n",
" <th>降水量(mm)</th>\n",
" <th>気温(℃)</th>\n",
" <th>相対湿度(%)</th>\n",
" <th>平均風速(m/s)</th>\n",
" <th>平均風向</th>\n",
" <th>最大瞬間風速(m/s)</th>\n",
" <th>最大瞬間風向</th>\n",
" <th>日照時間(分)</th>\n",
" <th>year</th>\n",
" <th>month</th>\n",
" <th>day</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>00:10</td>\n",
" <td>1001.2</td>\n",
" <td>1004.0</td>\n",
" <td>--</td>\n",
" <td>21.6</td>\n",
" <td>86</td>\n",
" <td>4.6</td>\n",
" <td>南</td>\n",
" <td>9.1</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>00:20</td>\n",
" <td>1001.4</td>\n",
" <td>1004.2</td>\n",
" <td>0.0</td>\n",
" <td>22.0</td>\n",
" <td>85</td>\n",
" <td>4.5</td>\n",
" <td>南</td>\n",
" <td>8.6</td>\n",
" <td>南南西</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>00:30</td>\n",
" <td>1001.3</td>\n",
" <td>1004.1</td>\n",
" <td>0.0</td>\n",
" <td>22.0</td>\n",
" <td>85</td>\n",
" <td>4.6</td>\n",
" <td>南</td>\n",
" <td>8.9</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>00:40</td>\n",
" <td>1001.3</td>\n",
" <td>1004.1</td>\n",
" <td>0.0</td>\n",
" <td>22.0</td>\n",
" <td>85</td>\n",
" <td>5.0</td>\n",
" <td>南</td>\n",
" <td>9.0</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>00:50</td>\n",
" <td>1001.1</td>\n",
" <td>1003.9</td>\n",
" <td>0.0</td>\n",
" <td>21.8</td>\n",
" <td>85</td>\n",
" <td>4.4</td>\n",
" <td>南</td>\n",
" <td>8.5</td>\n",
" <td>南南西</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7</th>\n",
" <td>01:00</td>\n",
" <td>1001.0</td>\n",
" <td>1003.8</td>\n",
" <td>--</td>\n",
" <td>21.7</td>\n",
" <td>86</td>\n",
" <td>4.5</td>\n",
" <td>南</td>\n",
" <td>8.3</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8</th>\n",
" <td>01:10</td>\n",
" <td>1000.9</td>\n",
" <td>1003.7</td>\n",
" <td>--</td>\n",
" <td>21.7</td>\n",
" <td>85</td>\n",
" <td>4.2</td>\n",
" <td>南</td>\n",
" <td>7.0</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9</th>\n",
" <td>01:20</td>\n",
" <td>1000.8</td>\n",
" <td>1003.6</td>\n",
" <td>--</td>\n",
" <td>21.9</td>\n",
" <td>84</td>\n",
" <td>3.1</td>\n",
" <td>南</td>\n",
" <td>5.7</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10</th>\n",
" <td>01:30</td>\n",
" <td>1000.4</td>\n",
" <td>1003.2</td>\n",
" <td>--</td>\n",
" <td>21.8</td>\n",
" <td>86</td>\n",
" <td>4.3</td>\n",
" <td>南南東</td>\n",
" <td>7.9</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>11</th>\n",
" <td>01:40</td>\n",
" <td>1000.3</td>\n",
" <td>1003.1</td>\n",
" <td>--</td>\n",
" <td>21.8</td>\n",
" <td>87</td>\n",
" <td>4.2</td>\n",
" <td>南南東</td>\n",
" <td>8.1</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>12</th>\n",
" <td>01:50</td>\n",
" <td>1000.4</td>\n",
" <td>1003.2</td>\n",
" <td>--</td>\n",
" <td>21.8</td>\n",
" <td>88</td>\n",
" <td>3.3</td>\n",
" <td>南南東</td>\n",
" <td>5.8</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>13</th>\n",
" <td>02:00</td>\n",
" <td>1000.0</td>\n",
" <td>1002.8</td>\n",
" <td>--</td>\n",
" <td>21.9</td>\n",
" <td>89</td>\n",
" <td>2.6</td>\n",
" <td>南南東</td>\n",
" <td>5.0</td>\n",
" <td>南南西</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>14</th>\n",
" <td>02:10</td>\n",
" <td>999.7</td>\n",
" <td>1002.5</td>\n",
" <td>--</td>\n",
" <td>21.9</td>\n",
" <td>88</td>\n",
" <td>3.5</td>\n",
" <td>南南東</td>\n",
" <td>6.6</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15</th>\n",
" <td>02:20</td>\n",
" <td>999.6</td>\n",
" <td>1002.4</td>\n",
" <td>--</td>\n",
" <td>21.7</td>\n",
" <td>89</td>\n",
" <td>2.9</td>\n",
" <td>南南東</td>\n",
" <td>7.3</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>16</th>\n",
" <td>02:30</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>--</td>\n",
" <td>21.9</td>\n",
" <td>89</td>\n",
" <td>3.4</td>\n",
" <td>南南東</td>\n",
" <td>5.6</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>17</th>\n",
" <td>02:40</td>\n",
" <td>999.1</td>\n",
" <td>1001.9</td>\n",
" <td>--</td>\n",
" <td>21.9</td>\n",
" <td>90</td>\n",
" <td>4.0</td>\n",
" <td>南南東</td>\n",
" <td>6.4</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>18</th>\n",
" <td>02:50</td>\n",
" <td>999.3</td>\n",
" <td>1002.1</td>\n",
" <td>--</td>\n",
" <td>21.8</td>\n",
" <td>91</td>\n",
" <td>3.6</td>\n",
" <td>南</td>\n",
" <td>6.1</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>19</th>\n",
" <td>03:00</td>\n",
" <td>999.0</td>\n",
" <td>1001.8</td>\n",
" <td>--</td>\n",
" <td>21.9</td>\n",
" <td>91</td>\n",
" <td>2.7</td>\n",
" <td>南</td>\n",
" <td>5.4</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>20</th>\n",
" <td>03:10</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>0.0</td>\n",
" <td>21.9</td>\n",
" <td>90</td>\n",
" <td>3.2</td>\n",
" <td>南南西</td>\n",
" <td>5.7</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>21</th>\n",
" <td>03:20</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>0.0</td>\n",
" <td>21.4</td>\n",
" <td>92</td>\n",
" <td>4.1</td>\n",
" <td>南</td>\n",
" <td>7.7</td>\n",
" <td>南南西</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>03:30</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>1.5</td>\n",
" <td>20.8</td>\n",
" <td>95</td>\n",
" <td>5.0</td>\n",
" <td>南南東</td>\n",
" <td>7.9</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>23</th>\n",
" <td>03:40</td>\n",
" <td>999.5</td>\n",
" <td>1002.3</td>\n",
" <td>4.0</td>\n",
" <td>19.6</td>\n",
" <td>97</td>\n",
" <td>4.2</td>\n",
" <td>南南東</td>\n",
" <td>6.3</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>24</th>\n",
" <td>03:50</td>\n",
" <td>999.3</td>\n",
" <td>1002.1</td>\n",
" <td>5.5</td>\n",
" <td>19.4</td>\n",
" <td>99</td>\n",
" <td>2.2</td>\n",
" <td>南南東</td>\n",
" <td>3.8</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25</th>\n",
" <td>04:00</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>0.0</td>\n",
" <td>19.6</td>\n",
" <td>100</td>\n",
" <td>1.7</td>\n",
" <td>南南東</td>\n",
" <td>3.9</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>26</th>\n",
" <td>04:10</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>0.0</td>\n",
" <td>19.9</td>\n",
" <td>100</td>\n",
" <td>2.6</td>\n",
" <td>南東</td>\n",
" <td>4.9</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>04:20</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>0.0</td>\n",
" <td>20.1</td>\n",
" <td>100</td>\n",
" <td>3.2</td>\n",
" <td>南東</td>\n",
" <td>6.3</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>28</th>\n",
" <td>04:30</td>\n",
" <td>999.5</td>\n",
" <td>1002.3</td>\n",
" <td>0.0</td>\n",
" <td>20.2</td>\n",
" <td>100</td>\n",
" <td>3.1</td>\n",
" <td>南南東</td>\n",
" <td>4.7</td>\n",
" <td>南</td>\n",
" <td>0.0</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>29</th>\n",
" <td>04:40</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>0.5</td>\n",
" <td>20.3</td>\n",
" <td>99</td>\n",
" <td>3.1</td>\n",
" <td>南</td>\n",
" <td>5.6</td>\n",
" <td>南</td>\n",
" <td>0.0</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>30</th>\n",
" <td>04:50</td>\n",
" <td>999.6</td>\n",
" <td>1002.4</td>\n",
" <td>0.0</td>\n",
" <td>20.3</td>\n",
" <td>99</td>\n",
" <td>3.4</td>\n",
" <td>南</td>\n",
" <td>6.7</td>\n",
" <td>南</td>\n",
" <td>0.0</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>31</th>\n",
" <td>05:00</td>\n",
" <td>999.4</td>\n",
" <td>1002.2</td>\n",
" <td>0.5</td>\n",
" <td>20.3</td>\n",
" <td>99</td>\n",
" <td>2.8</td>\n",
" <td>南南東</td>\n",
" <td>4.0</td>\n",
" <td>南</td>\n",
" <td>0.0</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>19:10</td>\n",
" <td>993.4</td>\n",
" <td>996.2</td>\n",
" <td>--</td>\n",
" <td>21.5</td>\n",
" <td>83</td>\n",
" <td>2.1</td>\n",
" <td>南南西</td>\n",
" <td>3.7</td>\n",
" <td>南西</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>19:20</td>\n",
" <td>993.4</td>\n",
" <td>996.2</td>\n",
" <td>--</td>\n",
" <td>21.2</td>\n",
" <td>82</td>\n",
" <td>1.7</td>\n",
" <td>南</td>\n",
" <td>3.0</td>\n",
" <td>南南西</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>19:30</td>\n",
" <td>993.4</td>\n",
" <td>996.2</td>\n",
" <td>--</td>\n",
" <td>20.5</td>\n",
" <td>86</td>\n",
" <td>1.3</td>\n",
" <td>南南西</td>\n",
" <td>2.2</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>119</th>\n",
" <td>19:40</td>\n",
" <td>993.5</td>\n",
" <td>996.3</td>\n",
" <td>--</td>\n",
" <td>20.4</td>\n",
" <td>89</td>\n",
" <td>1.5</td>\n",
" <td>南</td>\n",
" <td>2.4</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>120</th>\n",
" <td>19:50</td>\n",
" <td>993.6</td>\n",
" <td>996.4</td>\n",
" <td>--</td>\n",
" <td>20.5</td>\n",
" <td>89</td>\n",
" <td>2.6</td>\n",
" <td>南南東</td>\n",
" <td>3.5</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>121</th>\n",
" <td>20:00</td>\n",
" <td>993.6</td>\n",
" <td>996.4</td>\n",
" <td>--</td>\n",
" <td>20.6</td>\n",
" <td>89</td>\n",
" <td>2.8</td>\n",
" <td>南南東</td>\n",
" <td>3.7</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>122</th>\n",
" <td>20:10</td>\n",
" <td>993.8</td>\n",
" <td>996.6</td>\n",
" <td>--</td>\n",
" <td>20.6</td>\n",
" <td>92</td>\n",
" <td>2.9</td>\n",
" <td>南南東</td>\n",
" <td>4.2</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>123</th>\n",
" <td>20:20</td>\n",
" <td>993.9</td>\n",
" <td>996.7</td>\n",
" <td>--</td>\n",
" <td>20.5</td>\n",
" <td>92</td>\n",
" <td>2.7</td>\n",
" <td>南南東</td>\n",
" <td>3.9</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>124</th>\n",
" <td>20:30</td>\n",
" <td>994.0</td>\n",
" <td>996.8</td>\n",
" <td>--</td>\n",
" <td>20.4</td>\n",
" <td>93</td>\n",
" <td>1.7</td>\n",
" <td>南南東</td>\n",
" <td>2.8</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>125</th>\n",
" <td>20:40</td>\n",
" <td>994.0</td>\n",
" <td>996.8</td>\n",
" <td>--</td>\n",
" <td>20.3</td>\n",
" <td>94</td>\n",
" <td>1.7</td>\n",
" <td>南南東</td>\n",
" <td>2.4</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>126</th>\n",
" <td>20:50</td>\n",
" <td>993.9</td>\n",
" <td>996.7</td>\n",
" <td>--</td>\n",
" <td>20.1</td>\n",
" <td>95</td>\n",
" <td>1.6</td>\n",
" <td>南</td>\n",
" <td>2.2</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>127</th>\n",
" <td>21:00</td>\n",
" <td>993.9</td>\n",
" <td>996.7</td>\n",
" <td>--</td>\n",
" <td>20.1</td>\n",
" <td>96</td>\n",
" <td>2.1</td>\n",
" <td>南南東</td>\n",
" <td>2.7</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>128</th>\n",
" <td>21:10</td>\n",
" <td>994.0</td>\n",
" <td>996.8</td>\n",
" <td>--</td>\n",
" <td>20.0</td>\n",
" <td>96</td>\n",
" <td>2.0</td>\n",
" <td>南南東</td>\n",
" <td>3.1</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>129</th>\n",
" <td>21:20</td>\n",
" <td>994.0</td>\n",
" <td>996.8</td>\n",
" <td>--</td>\n",
" <td>20.0</td>\n",
" <td>97</td>\n",
" <td>2.2</td>\n",
" <td>南東</td>\n",
" <td>3.0</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>130</th>\n",
" <td>21:30</td>\n",
" <td>993.9</td>\n",
" <td>996.7</td>\n",
" <td>--</td>\n",
" <td>20.0</td>\n",
" <td>97</td>\n",
" <td>2.0</td>\n",
" <td>南東</td>\n",
" <td>3.1</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>131</th>\n",
" <td>21:40</td>\n",
" <td>993.7</td>\n",
" <td>996.5</td>\n",
" <td>--</td>\n",
" <td>20.3</td>\n",
" <td>96</td>\n",
" <td>1.6</td>\n",
" <td>南東</td>\n",
" <td>2.3</td>\n",
" <td>南</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>132</th>\n",
" <td>21:50</td>\n",
" <td>993.7</td>\n",
" <td>996.5</td>\n",
" <td>--</td>\n",
" <td>20.1</td>\n",
" <td>96</td>\n",
" <td>1.4</td>\n",
" <td>南東</td>\n",
" <td>2.5</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>133</th>\n",
" <td>22:00</td>\n",
" <td>993.5</td>\n",
" <td>996.3</td>\n",
" <td>--</td>\n",
" <td>20.1</td>\n",
" <td>97</td>\n",
" <td>1.9</td>\n",
" <td>南東</td>\n",
" <td>3.4</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>134</th>\n",
" <td>22:10</td>\n",
" <td>993.2</td>\n",
" <td>996.0</td>\n",
" <td>--</td>\n",
" <td>20.6</td>\n",
" <td>93</td>\n",
" <td>2.3</td>\n",
" <td>南東</td>\n",
" <td>3.3</td>\n",
" <td>東南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>135</th>\n",
" <td>22:20</td>\n",
" <td>993.1</td>\n",
" <td>995.9</td>\n",
" <td>--</td>\n",
" <td>20.3</td>\n",
" <td>96</td>\n",
" <td>2.1</td>\n",
" <td>南東</td>\n",
" <td>2.9</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>136</th>\n",
" <td>22:30</td>\n",
" <td>993.1</td>\n",
" <td>995.9</td>\n",
" <td>--</td>\n",
" <td>20.4</td>\n",
" <td>94</td>\n",
" <td>2.5</td>\n",
" <td>南東</td>\n",
" <td>4.2</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>137</th>\n",
" <td>22:40</td>\n",
" <td>992.9</td>\n",
" <td>995.7</td>\n",
" <td>--</td>\n",
" <td>20.2</td>\n",
" <td>96</td>\n",
" <td>2.6</td>\n",
" <td>南南東</td>\n",
" <td>4.3</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>138</th>\n",
" <td>22:50</td>\n",
" <td>992.8</td>\n",
" <td>995.6</td>\n",
" <td>--</td>\n",
" <td>20.6</td>\n",
" <td>93</td>\n",
" <td>2.9</td>\n",
" <td>南南東</td>\n",
" <td>5.2</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>139</th>\n",
" <td>23:00</td>\n",
" <td>992.8</td>\n",
" <td>995.6</td>\n",
" <td>--</td>\n",
" <td>20.8</td>\n",
" <td>91</td>\n",
" <td>3.9</td>\n",
" <td>南南東</td>\n",
" <td>5.1</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>140</th>\n",
" <td>23:10</td>\n",
" <td>992.9</td>\n",
" <td>995.7</td>\n",
" <td>--</td>\n",
" <td>20.6</td>\n",
" <td>92</td>\n",
" <td>3.0</td>\n",
" <td>南東</td>\n",
" <td>5.5</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>141</th>\n",
" <td>23:20</td>\n",
" <td>992.7</td>\n",
" <td>995.5</td>\n",
" <td>--</td>\n",
" <td>20.1</td>\n",
" <td>95</td>\n",
" <td>1.3</td>\n",
" <td>南南東</td>\n",
" <td>2.5</td>\n",
" <td>南南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>142</th>\n",
" <td>23:30</td>\n",
" <td>992.6</td>\n",
" <td>995.4</td>\n",
" <td>--</td>\n",
" <td>20.0</td>\n",
" <td>95</td>\n",
" <td>1.8</td>\n",
" <td>南東</td>\n",
" <td>2.9</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>143</th>\n",
" <td>23:40</td>\n",
" <td>992.4</td>\n",
" <td>995.2</td>\n",
" <td>--</td>\n",
" <td>19.8</td>\n",
" <td>97</td>\n",
" <td>1.8</td>\n",
" <td>南東</td>\n",
" <td>2.8</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>144</th>\n",
" <td>23:50</td>\n",
" <td>992.3</td>\n",
" <td>995.1</td>\n",
" <td>--</td>\n",
" <td>19.7</td>\n",
" <td>98</td>\n",
" <td>1.0</td>\n",
" <td>南東</td>\n",
" <td>2.1</td>\n",
" <td>南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>145</th>\n",
" <td>24:00</td>\n",
" <td>992.2</td>\n",
" <td>995.0</td>\n",
" <td>--</td>\n",
" <td>19.5</td>\n",
" <td>98</td>\n",
" <td>1.3</td>\n",
" <td>東南東</td>\n",
" <td>1.9</td>\n",
" <td>東南東</td>\n",
" <td>NaN</td>\n",
" <td>2017</td>\n",
" <td>6</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>144 rows × 14 columns</p>\n",
"</div>"
],
"text/plain": [
" 時分 現地気圧(hPa) 海面気圧(hPa) 降水量(mm) 気温(℃) 相対湿度(%) 平均風速(m/s) 平均風向 \\\n",
"2 00:10 1001.2 1004.0 -- 21.6 86 4.6 南 \n",
"3 00:20 1001.4 1004.2 0.0 22.0 85 4.5 南 \n",
"4 00:30 1001.3 1004.1 0.0 22.0 85 4.6 南 \n",
"5 00:40 1001.3 1004.1 0.0 22.0 85 5.0 南 \n",
"6 00:50 1001.1 1003.9 0.0 21.8 85 4.4 南 \n",
"7 01:00 1001.0 1003.8 -- 21.7 86 4.5 南 \n",
"8 01:10 1000.9 1003.7 -- 21.7 85 4.2 南 \n",
"9 01:20 1000.8 1003.6 -- 21.9 84 3.1 南 \n",
"10 01:30 1000.4 1003.2 -- 21.8 86 4.3 南南東 \n",
"11 01:40 1000.3 1003.1 -- 21.8 87 4.2 南南東 \n",
"12 01:50 1000.4 1003.2 -- 21.8 88 3.3 南南東 \n",
"13 02:00 1000.0 1002.8 -- 21.9 89 2.6 南南東 \n",
"14 02:10 999.7 1002.5 -- 21.9 88 3.5 南南東 \n",
"15 02:20 999.6 1002.4 -- 21.7 89 2.9 南南東 \n",
"16 02:30 999.4 1002.2 -- 21.9 89 3.4 南南東 \n",
"17 02:40 999.1 1001.9 -- 21.9 90 4.0 南南東 \n",
"18 02:50 999.3 1002.1 -- 21.8 91 3.6 南 \n",
"19 03:00 999.0 1001.8 -- 21.9 91 2.7 南 \n",
"20 03:10 999.4 1002.2 0.0 21.9 90 3.2 南南西 \n",
"21 03:20 999.4 1002.2 0.0 21.4 92 4.1 南 \n",
"22 03:30 999.4 1002.2 1.5 20.8 95 5.0 南南東 \n",
"23 03:40 999.5 1002.3 4.0 19.6 97 4.2 南南東 \n",
"24 03:50 999.3 1002.1 5.5 19.4 99 2.2 南南東 \n",
"25 04:00 999.4 1002.2 0.0 19.6 100 1.7 南南東 \n",
"26 04:10 999.4 1002.2 0.0 19.9 100 2.6 南東 \n",
"27 04:20 999.4 1002.2 0.0 20.1 100 3.2 南東 \n",
"28 04:30 999.5 1002.3 0.0 20.2 100 3.1 南南東 \n",
"29 04:40 999.4 1002.2 0.5 20.3 99 3.1 南 \n",
"30 04:50 999.6 1002.4 0.0 20.3 99 3.4 南 \n",
"31 05:00 999.4 1002.2 0.5 20.3 99 2.8 南南東 \n",
".. ... ... ... ... ... ... ... ... \n",
"116 19:10 993.4 996.2 -- 21.5 83 2.1 南南西 \n",
"117 19:20 993.4 996.2 -- 21.2 82 1.7 南 \n",
"118 19:30 993.4 996.2 -- 20.5 86 1.3 南南西 \n",
"119 19:40 993.5 996.3 -- 20.4 89 1.5 南 \n",
"120 19:50 993.6 996.4 -- 20.5 89 2.6 南南東 \n",
"121 20:00 993.6 996.4 -- 20.6 89 2.8 南南東 \n",
"122 20:10 993.8 996.6 -- 20.6 92 2.9 南南東 \n",
"123 20:20 993.9 996.7 -- 20.5 92 2.7 南南東 \n",
"124 20:30 994.0 996.8 -- 20.4 93 1.7 南南東 \n",
"125 20:40 994.0 996.8 -- 20.3 94 1.7 南南東 \n",
"126 20:50 993.9 996.7 -- 20.1 95 1.6 南 \n",
"127 21:00 993.9 996.7 -- 20.1 96 2.1 南南東 \n",
"128 21:10 994.0 996.8 -- 20.0 96 2.0 南南東 \n",
"129 21:20 994.0 996.8 -- 20.0 97 2.2 南東 \n",
"130 21:30 993.9 996.7 -- 20.0 97 2.0 南東 \n",
"131 21:40 993.7 996.5 -- 20.3 96 1.6 南東 \n",
"132 21:50 993.7 996.5 -- 20.1 96 1.4 南東 \n",
"133 22:00 993.5 996.3 -- 20.1 97 1.9 南東 \n",
"134 22:10 993.2 996.0 -- 20.6 93 2.3 南東 \n",
"135 22:20 993.1 995.9 -- 20.3 96 2.1 南東 \n",
"136 22:30 993.1 995.9 -- 20.4 94 2.5 南東 \n",
"137 22:40 992.9 995.7 -- 20.2 96 2.6 南南東 \n",
"138 22:50 992.8 995.6 -- 20.6 93 2.9 南南東 \n",
"139 23:00 992.8 995.6 -- 20.8 91 3.9 南南東 \n",
"140 23:10 992.9 995.7 -- 20.6 92 3.0 南東 \n",
"141 23:20 992.7 995.5 -- 20.1 95 1.3 南南東 \n",
"142 23:30 992.6 995.4 -- 20.0 95 1.8 南東 \n",
"143 23:40 992.4 995.2 -- 19.8 97 1.8 南東 \n",
"144 23:50 992.3 995.1 -- 19.7 98 1.0 南東 \n",
"145 24:00 992.2 995.0 -- 19.5 98 1.3 東南東 \n",
"\n",
" 最大瞬間風速(m/s) 最大瞬間風向 日照時間(分) year month day \n",
"2 9.1 南 NaN 2017 6 1 \n",
"3 8.6 南南西 NaN 2017 6 1 \n",
"4 8.9 南南東 NaN 2017 6 1 \n",
"5 9.0 南 NaN 2017 6 1 \n",
"6 8.5 南南西 NaN 2017 6 1 \n",
"7 8.3 南南東 NaN 2017 6 1 \n",
"8 7.0 南 NaN 2017 6 1 \n",
"9 5.7 南 NaN 2017 6 1 \n",
"10 7.9 南南東 NaN 2017 6 1 \n",
"11 8.1 南南東 NaN 2017 6 1 \n",
"12 5.8 南南東 NaN 2017 6 1 \n",
"13 5.0 南南西 NaN 2017 6 1 \n",
"14 6.6 南 NaN 2017 6 1 \n",
"15 7.3 南南東 NaN 2017 6 1 \n",
"16 5.6 南南東 NaN 2017 6 1 \n",
"17 6.4 南南東 NaN 2017 6 1 \n",
"18 6.1 南 NaN 2017 6 1 \n",
"19 5.4 南南東 NaN 2017 6 1 \n",
"20 5.7 南 NaN 2017 6 1 \n",
"21 7.7 南南西 NaN 2017 6 1 \n",
"22 7.9 南南東 NaN 2017 6 1 \n",
"23 6.3 南 NaN 2017 6 1 \n",
"24 3.8 南南東 NaN 2017 6 1 \n",
"25 3.9 南 NaN 2017 6 1 \n",
"26 4.9 南南東 NaN 2017 6 1 \n",
"27 6.3 南東 NaN 2017 6 1 \n",
"28 4.7 南 0.0 2017 6 1 \n",
"29 5.6 南 0.0 2017 6 1 \n",
"30 6.7 南 0.0 2017 6 1 \n",
"31 4.0 南 0.0 2017 6 1 \n",
".. ... ... ... ... ... ... \n",
"116 3.7 南西 NaN 2017 6 1 \n",
"117 3.0 南南西 NaN 2017 6 1 \n",
"118 2.2 南 NaN 2017 6 1 \n",
"119 2.4 南 NaN 2017 6 1 \n",
"120 3.5 南南東 NaN 2017 6 1 \n",
"121 3.7 南南東 NaN 2017 6 1 \n",
"122 4.2 南南東 NaN 2017 6 1 \n",
"123 3.9 南南東 NaN 2017 6 1 \n",
"124 2.8 南南東 NaN 2017 6 1 \n",
"125 2.4 南南東 NaN 2017 6 1 \n",
"126 2.2 南 NaN 2017 6 1 \n",
"127 2.7 南南東 NaN 2017 6 1 \n",
"128 3.1 南東 NaN 2017 6 1 \n",
"129 3.0 南南東 NaN 2017 6 1 \n",
"130 3.1 南東 NaN 2017 6 1 \n",
"131 2.3 南 NaN 2017 6 1 \n",
"132 2.5 南南東 NaN 2017 6 1 \n",
"133 3.4 南東 NaN 2017 6 1 \n",
"134 3.3 東南東 NaN 2017 6 1 \n",
"135 2.9 南東 NaN 2017 6 1 \n",
"136 4.2 南東 NaN 2017 6 1 \n",
"137 4.3 南南東 NaN 2017 6 1 \n",
"138 5.2 南南東 NaN 2017 6 1 \n",
"139 5.1 南南東 NaN 2017 6 1 \n",
"140 5.5 南南東 NaN 2017 6 1 \n",
"141 2.5 南南東 NaN 2017 6 1 \n",
"142 2.9 南東 NaN 2017 6 1 \n",
"143 2.8 南東 NaN 2017 6 1 \n",
"144 2.1 南東 NaN 2017 6 1 \n",
"145 1.9 東南東 NaN 2017 6 1 \n",
"\n",
"[144 rows x 14 columns]"
]
},
"execution_count": 207,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"d['year'], d['month'], d['day']=date \n",
"d"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# Get all dates in the target period\n",
"From 2004 to 2016"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"d1 = datetime(2004, 1,1)\n",
"d2 = datetime(2016,12,31)\n",
"\n",
"delta = d2-d1"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"4749\n"
]
}
],
"source": [
"span = []\n",
"for i in range(delta.days+1):\n",
" intdate = map(int, str(d1+timedelta(days=i)).split(' ')[0].split('-'))\n",
" span.append(intdate)\n",
"print len(span)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"(2004, 1, 1)\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/yingminc/anaconda3/lib/python2.7/site-packages/ipykernel_launcher.py:7: DeprecationWarning: \n",
".ix is deprecated. Please use\n",
".loc for label based indexing or\n",
".iloc for positional indexing\n",
"\n",
"See the documentation here:\n",
"http://pandas.pydata.org/pandas-docs/stable/indexing.html#deprecate_ix\n",
" import sys\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"(2004, 1, 2)\n",
"(2004, 1, 3)\n",
"(2004, 1, 4)\n",
"(2004, 1, 5)\n",
"(2004, 1, 6)\n",
"(2004, 1, 7)\n",
"(2004, 1, 8)\n",
"(2004, 1, 9)\n",
"(2004, 1, 10)\n",
"(2004, 1, 11)\n",
"(2004, 1, 12)\n",
"(2004, 1, 13)\n",
"(2004, 1, 14)\n",
"(2004, 1, 15)\n",
"(2004, 1, 16)\n",
"(2004, 1, 17)\n",
"(2004, 1, 18)\n",
"(2004, 1, 19)\n"
]
},
{
"ename": "KeyboardInterrupt",
"evalue": "",
"output_type": "error",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)",
"\u001b[0;32m<ipython-input-12-439611222f01>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[1;32m 4\u001b[0m \u001b[0;32mprint\u001b[0m \u001b[0mdate\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 5\u001b[0m \u001b[0murl\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m'http://www.data.jma.go.jp/obd/stats/etrn/view/10min_a1.php?prec_no=44&block_no=1002&year=%s&month=%s&day=%s&view='\u001b[0m \u001b[0;34m%\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdate\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 6\u001b[0;31m \u001b[0md\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread_html\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0murl\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 7\u001b[0m \u001b[0md\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0md\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mix\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;36m145\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 8\u001b[0m \u001b[0md\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'year'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0md\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'month'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0md\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'day'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mdate\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/pandas/io/html.pyc\u001b[0m in \u001b[0;36mread_html\u001b[0;34m(io, match, flavor, header, index_col, skiprows, attrs, parse_dates, tupleize_cols, thousands, encoding, decimal, converters, na_values, keep_default_na)\u001b[0m\n\u001b[1;32m 904\u001b[0m \u001b[0mthousands\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mthousands\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mattrs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mattrs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mencoding\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mencoding\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 905\u001b[0m \u001b[0mdecimal\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mdecimal\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mconverters\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mconverters\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mna_values\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mna_values\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 906\u001b[0;31m keep_default_na=keep_default_na)\n\u001b[0m",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/pandas/io/html.pyc\u001b[0m in \u001b[0;36m_parse\u001b[0;34m(flavor, io, match, attrs, encoding, **kwargs)\u001b[0m\n\u001b[1;32m 735\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 736\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 737\u001b[0;31m \u001b[0mtables\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mparse_tables\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 738\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mException\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0mcaught\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 739\u001b[0m \u001b[0mretained\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcaught\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/pandas/io/html.pyc\u001b[0m in \u001b[0;36mparse_tables\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 195\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 196\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mparse_tables\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 197\u001b[0;31m \u001b[0mtables\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_parse_tables\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_build_doc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmatch\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mattrs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 198\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_build_table\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtable\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mtable\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 199\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/pandas/io/html.pyc\u001b[0m in \u001b[0;36m_build_doc\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 453\u001b[0m \u001b[0;32mfrom\u001b[0m \u001b[0mbs4\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mBeautifulSoup\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 454\u001b[0m return BeautifulSoup(self._setup_build_doc(), features='html5lib',\n\u001b[0;32m--> 455\u001b[0;31m from_encoding=self.encoding)\n\u001b[0m\u001b[1;32m 456\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 457\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/bs4/__init__.pyc\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, markup, features, builder, parse_only, from_encoding, exclude_encodings, **kwargs)\u001b[0m\n\u001b[1;32m 226\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mreset\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 227\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 228\u001b[0;31m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_feed\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 229\u001b[0m \u001b[0;32mbreak\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 230\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mParserRejectedMarkup\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/bs4/__init__.pyc\u001b[0m in \u001b[0;36m_feed\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 287\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbuilder\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mreset\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 288\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 289\u001b[0;31m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbuilder\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfeed\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmarkup\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 290\u001b[0m \u001b[0;31m# Close out any unfinished strings and close all the open tags.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 291\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mendData\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/bs4/builder/_html5lib.pyc\u001b[0m in \u001b[0;36mfeed\u001b[0;34m(self, markup)\u001b[0m\n\u001b[1;32m 70\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 71\u001b[0m \u001b[0mextra_kwargs\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'encoding'\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0muser_specified_encoding\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 72\u001b[0;31m \u001b[0mdoc\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mparser\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mparse\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmarkup\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mextra_kwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 73\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 74\u001b[0m \u001b[0;31m# Set the character encoding detected by the tokenizer.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/html5lib/html5parser.pyc\u001b[0m in \u001b[0;36mparse\u001b[0;34m(self, stream, encoding, parseMeta, useChardet)\u001b[0m\n\u001b[1;32m 222\u001b[0m \"\"\"\n\u001b[1;32m 223\u001b[0m self._parse(stream, innerHTML=False, encoding=encoding,\n\u001b[0;32m--> 224\u001b[0;31m parseMeta=parseMeta, useChardet=useChardet)\n\u001b[0m\u001b[1;32m 225\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtree\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgetDocument\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 226\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/html5lib/html5parser.pyc\u001b[0m in \u001b[0;36m_parse\u001b[0;34m(self, stream, innerHTML, container, encoding, parseMeta, useChardet, **kwargs)\u001b[0m\n\u001b[1;32m 91\u001b[0m \u001b[0;32mwhile\u001b[0m \u001b[0mTrue\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 92\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 93\u001b[0;31m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmainLoop\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 94\u001b[0m \u001b[0;32mbreak\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 95\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mReparseException\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/html5lib/html5parser.pyc\u001b[0m in \u001b[0;36mmainLoop\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 152\u001b[0m \u001b[0mParseErrorToken\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtokenTypes\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"ParseError\"\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 153\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 154\u001b[0;31m \u001b[0;32mfor\u001b[0m \u001b[0mtoken\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnormalizedTokens\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 155\u001b[0m \u001b[0mnew_token\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtoken\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 156\u001b[0m \u001b[0;32mwhile\u001b[0m \u001b[0mnew_token\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/html5lib/html5parser.pyc\u001b[0m in \u001b[0;36mnormalizedTokens\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 209\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mnormalizedTokens\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 210\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mtoken\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtokenizer\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 211\u001b[0;31m \u001b[0;32myield\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnormalizeToken\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtoken\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 212\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 213\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mparse\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstream\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mencoding\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mNone\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mparseMeta\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mTrue\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0museChardet\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/home/yingminc/anaconda3/lib/python2.7/site-packages/html5lib/html5parser.pyc\u001b[0m in \u001b[0;36mnormalizeToken\u001b[0;34m(self, token)\u001b[0m\n\u001b[1;32m 252\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 253\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mtoken\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"type\"\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0mtokenTypes\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"StartTag\"\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 254\u001b[0;31m \u001b[0mtoken\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"data\"\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtoken\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"data\"\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m-\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 255\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 256\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mtoken\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;31mKeyboardInterrupt\u001b[0m: "
]
}
],
"source": [
"# Download the 10-minute weather table for every day in `span`, stack the daily\n",
"# tables into one DataFrame, label the columns and write the result to a CSV file.\n",
"# NOTE(review): `span` comes from an earlier cell; each item is indexed here as\n",
"# (year, month, day) -- confirm against the cell that builds it.\n",
"frames = []\n",
"for day in span:\n",
"    date = (day[0], day[1], day[2])\n",
"    # Parenthesised form prints the same tuple on the Python 2 kernel and also parses on Python 3.\n",
"    print(date)\n",
"    # block_no=1002 on the 10min_a1 page is the Nerima observation point (see the first load cell).\n",
"    url = 'http://www.data.jma.go.jp/obd/stats/etrn/view/10min_a1.php?prec_no=44&block_no=1002&year=%s&month=%s&day=%s&view=' % date\n",
"    d = pd.read_html(url)[0]\n",
"    # Keep the rows labelled 2..145 (both ends inclusive); presumably the 144 ten-minute\n",
"    # records that follow the header rows -- TODO confirm against the page layout.\n",
"    # .loc replaces the deprecated .ix indexer (same label-based slice on the integer index),\n",
"    # and .copy() makes the slice an independent frame so the column assignments below\n",
"    # do not write into a view of the parsed table (avoids SettingWithCopyWarning).\n",
"    d = d.loc[2:145].copy()\n",
"    # Tag every row with the date it was downloaded for.\n",
"    d['year'], d['month'], d['day'] = date\n",
"    frames.append(d)\n",
"\n",
"# One concat after the loop instead of growing a frame inside it.\n",
"total = pd.concat(frames)\n",
"# Column labels: the 8 table columns followed by the 3 date columns added above.\n",
"hd = ['時分', '降水量(mm)', '気温(℃)', '平均風速(m/s)','平均風向','最大瞬間風速(m/s)', '最大瞬間風向','日照時間(分)','year','month','day']\n",
"# Python 2 kernel: the literals above are byte strings, so decode them to unicode labels.\n",
"hd_utf = [i.decode('utf-8') for i in hd]\n",
"total.columns = hd_utf\n",
"total['location'] = '練馬'.decode('utf-8')\n",
"\n",
"total.to_csv('total_weather.csv', index=False, header=True, encoding='utf-8')\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 2",
"language": "python",
"name": "python2"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 2
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython2",
"version": "2.7.13"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment