Skip to content

Instantly share code, notes, and snippets.

@decisionstats
Created December 17, 2015 02:01
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save decisionstats/01fc540363f1081c5358 to your computer and use it in GitHub Desktop.
Save decisionstats/01fc540363f1081c5358 to your computer and use it in GitHub Desktop.
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"- Import Package \n",
"We import the pandas package with the alias pd\n",
"- Import Data\n",
"We import the Boston Dataset from \n",
"- Select Data by Row number\n",
"- Select Data by Column Name\n",
"- Select Data by Row and Column\n",
"- Select Data by Condition"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": [
"import pandas as pd"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {
"collapsed": false
},
"outputs": [],
"source": [
"Boston =pd.read_csv(\"http://vincentarelbundock.github.io/Rdatasets/csv/MASS/Boston.csv\")"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Unnamed: 0</th>\n",
" <th>crim</th>\n",
" <th>zn</th>\n",
" <th>indus</th>\n",
" <th>chas</th>\n",
" <th>nox</th>\n",
" <th>rm</th>\n",
" <th>age</th>\n",
" <th>dis</th>\n",
" <th>rad</th>\n",
" <th>tax</th>\n",
" <th>ptratio</th>\n",
" <th>black</th>\n",
" <th>lstat</th>\n",
" <th>medv</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>1</td>\n",
" <td>0.00632</td>\n",
" <td>18</td>\n",
" <td>2.31</td>\n",
" <td>0</td>\n",
" <td>0.538</td>\n",
" <td>6.575</td>\n",
" <td>65.2</td>\n",
" <td>4.0900</td>\n",
" <td>1</td>\n",
" <td>296</td>\n",
" <td>15.3</td>\n",
" <td>396.90</td>\n",
" <td>4.98</td>\n",
" <td>24.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>2</td>\n",
" <td>0.02731</td>\n",
" <td>0</td>\n",
" <td>7.07</td>\n",
" <td>0</td>\n",
" <td>0.469</td>\n",
" <td>6.421</td>\n",
" <td>78.9</td>\n",
" <td>4.9671</td>\n",
" <td>2</td>\n",
" <td>242</td>\n",
" <td>17.8</td>\n",
" <td>396.90</td>\n",
" <td>9.14</td>\n",
" <td>21.6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>3</td>\n",
" <td>0.02729</td>\n",
" <td>0</td>\n",
" <td>7.07</td>\n",
" <td>0</td>\n",
" <td>0.469</td>\n",
" <td>7.185</td>\n",
" <td>61.1</td>\n",
" <td>4.9671</td>\n",
" <td>2</td>\n",
" <td>242</td>\n",
" <td>17.8</td>\n",
" <td>392.83</td>\n",
" <td>4.03</td>\n",
" <td>34.7</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>4</td>\n",
" <td>0.03237</td>\n",
" <td>0</td>\n",
" <td>2.18</td>\n",
" <td>0</td>\n",
" <td>0.458</td>\n",
" <td>6.998</td>\n",
" <td>45.8</td>\n",
" <td>6.0622</td>\n",
" <td>3</td>\n",
" <td>222</td>\n",
" <td>18.7</td>\n",
" <td>394.63</td>\n",
" <td>2.94</td>\n",
" <td>33.4</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>5</td>\n",
" <td>0.06905</td>\n",
" <td>0</td>\n",
" <td>2.18</td>\n",
" <td>0</td>\n",
" <td>0.458</td>\n",
" <td>7.147</td>\n",
" <td>54.2</td>\n",
" <td>6.0622</td>\n",
" <td>3</td>\n",
" <td>222</td>\n",
" <td>18.7</td>\n",
" <td>396.90</td>\n",
" <td>5.33</td>\n",
" <td>36.2</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Unnamed: 0 crim zn indus chas nox rm age dis rad tax \\\n",
"0 1 0.00632 18 2.31 0 0.538 6.575 65.2 4.0900 1 296 \n",
"1 2 0.02731 0 7.07 0 0.469 6.421 78.9 4.9671 2 242 \n",
"2 3 0.02729 0 7.07 0 0.469 7.185 61.1 4.9671 2 242 \n",
"3 4 0.03237 0 2.18 0 0.458 6.998 45.8 6.0622 3 222 \n",
"4 5 0.06905 0 2.18 0 0.458 7.147 54.2 6.0622 3 222 \n",
"\n",
" ptratio black lstat medv \n",
"0 15.3 396.90 4.98 24.0 \n",
"1 17.8 396.90 9.14 21.6 \n",
"2 17.8 392.83 4.03 34.7 \n",
"3 18.7 394.63 2.94 33.4 \n",
"4 18.7 396.90 5.33 36.2 "
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston.head(5) #Gives first few rows. In R we typically use head(object) while in Python we would use object.head()"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {
"collapsed": false
},
"outputs": [],
"source": [
"Boston=Boston.drop('Unnamed: 0', 1) #Dropping a particular variable"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/plain": [
"crim float64\n",
"zn float64\n",
"indus float64\n",
"chas int64\n",
"nox float64\n",
"rm float64\n",
"age float64\n",
"dis float64\n",
"rad int64\n",
"tax int64\n",
"ptratio float64\n",
"black float64\n",
"lstat float64\n",
"medv float64\n",
"dtype: object"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston.dtypes"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {
"collapsed": false
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"<class 'pandas.core.frame.DataFrame'>\n",
"Int64Index: 506 entries, 0 to 505\n",
"Data columns (total 14 columns):\n",
"crim 506 non-null float64\n",
"zn 506 non-null float64\n",
"indus 506 non-null float64\n",
"chas 506 non-null int64\n",
"nox 506 non-null float64\n",
"rm 506 non-null float64\n",
"age 506 non-null float64\n",
"dis 506 non-null float64\n",
"rad 506 non-null int64\n",
"tax 506 non-null int64\n",
"ptratio 506 non-null float64\n",
"black 506 non-null float64\n",
"lstat 506 non-null float64\n",
"medv 506 non-null float64\n",
"dtypes: float64(11), int64(3)\n",
"memory usage: 59.3 KB\n"
]
}
],
"source": [
"Boston.info()# Gives information of object. In R this is given by str"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/plain": [
"pandas.core.frame.DataFrame"
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"type(Boston) #Gives type of object. In R this is given by class"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/plain": [
"(506, 14)"
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston.shape #Gives rows and columns. In R this is given by dim"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/plain": [
"['T',\n",
" '_AXIS_ALIASES',\n",
" '_AXIS_IALIASES',\n",
" '_AXIS_LEN',\n",
" '_AXIS_NAMES',\n",
" '_AXIS_NUMBERS',\n",
" '_AXIS_ORDERS',\n",
" '_AXIS_REVERSED',\n",
" '_AXIS_SLICEMAP',\n",
" '__abs__',\n",
" '__add__',\n",
" '__and__',\n",
" '__array__',\n",
" '__array_wrap__',\n",
" '__bool__',\n",
" '__bytes__',\n",
" '__class__',\n",
" '__contains__',\n",
" '__delattr__',\n",
" '__delitem__',\n",
" '__dict__',\n",
" '__dir__',\n",
" '__div__',\n",
" '__doc__',\n",
" '__eq__',\n",
" '__finalize__',\n",
" '__floordiv__',\n",
" '__format__',\n",
" '__ge__',\n",
" '__getattr__',\n",
" '__getattribute__',\n",
" '__getitem__',\n",
" '__getstate__',\n",
" '__gt__',\n",
" '__hash__',\n",
" '__iadd__',\n",
" '__imul__',\n",
" '__init__',\n",
" '__invert__',\n",
" '__ipow__',\n",
" '__isub__',\n",
" '__iter__',\n",
" '__itruediv__',\n",
" '__le__',\n",
" '__len__',\n",
" '__lt__',\n",
" '__mod__',\n",
" '__module__',\n",
" '__mul__',\n",
" '__ne__',\n",
" '__neg__',\n",
" '__new__',\n",
" '__nonzero__',\n",
" '__or__',\n",
" '__pow__',\n",
" '__radd__',\n",
" '__rand__',\n",
" '__rdiv__',\n",
" '__reduce__',\n",
" '__reduce_ex__',\n",
" '__repr__',\n",
" '__rfloordiv__',\n",
" '__rmod__',\n",
" '__rmul__',\n",
" '__ror__',\n",
" '__rpow__',\n",
" '__rsub__',\n",
" '__rtruediv__',\n",
" '__rxor__',\n",
" '__setattr__',\n",
" '__setitem__',\n",
" '__setstate__',\n",
" '__sizeof__',\n",
" '__str__',\n",
" '__sub__',\n",
" '__subclasshook__',\n",
" '__truediv__',\n",
" '__unicode__',\n",
" '__weakref__',\n",
" '__xor__',\n",
" '_accessors',\n",
" '_add_numeric_operations',\n",
" '_agg_by_level',\n",
" '_align_frame',\n",
" '_align_series',\n",
" '_apply_broadcast',\n",
" '_apply_empty_result',\n",
" '_apply_raw',\n",
" '_apply_standard',\n",
" '_at',\n",
" '_auto_consolidate',\n",
" '_box_col_values',\n",
" '_box_item_values',\n",
" '_check_inplace_setting',\n",
" '_check_is_chained_assignment_possible',\n",
" '_check_setitem_copy',\n",
" '_clear_item_cache',\n",
" '_combine_const',\n",
" '_combine_frame',\n",
" '_combine_match_columns',\n",
" '_combine_match_index',\n",
" '_combine_series',\n",
" '_combine_series_infer',\n",
" '_compare_frame',\n",
" '_compare_frame_evaluate',\n",
" '_consolidate_inplace',\n",
" '_construct_axes_dict',\n",
" '_construct_axes_dict_for_slice',\n",
" '_construct_axes_dict_from',\n",
" '_construct_axes_from_arguments',\n",
" '_constructor',\n",
" '_constructor_expanddim',\n",
" '_constructor_sliced',\n",
" '_count_level',\n",
" '_create_indexer',\n",
" '_dir_additions',\n",
" '_dir_deletions',\n",
" '_ensure_valid_index',\n",
" '_expand_axes',\n",
" '_flex_compare_frame',\n",
" '_from_arrays',\n",
" '_from_axes',\n",
" '_get_agg_axis',\n",
" '_get_axis',\n",
" '_get_axis_name',\n",
" '_get_axis_number',\n",
" '_get_axis_resolvers',\n",
" '_get_block_manager_axis',\n",
" '_get_bool_data',\n",
" '_get_cacher',\n",
" '_get_index_resolvers',\n",
" '_get_item_cache',\n",
" '_get_numeric_data',\n",
" '_get_values',\n",
" '_getitem_array',\n",
" '_getitem_column',\n",
" '_getitem_frame',\n",
" '_getitem_multilevel',\n",
" '_getitem_slice',\n",
" '_iat',\n",
" '_iget_item_cache',\n",
" '_iloc',\n",
" '_indexed_same',\n",
" '_info_axis',\n",
" '_info_axis_name',\n",
" '_info_axis_number',\n",
" '_info_repr',\n",
" '_init_dict',\n",
" '_init_mgr',\n",
" '_init_ndarray',\n",
" '_internal_names',\n",
" '_internal_names_set',\n",
" '_is_cached',\n",
" '_is_datelike_mixed_type',\n",
" '_is_mixed_type',\n",
" '_is_numeric_mixed_type',\n",
" '_is_view',\n",
" '_ix',\n",
" '_ixs',\n",
" '_join_compat',\n",
" '_loc',\n",
" '_maybe_cache_changed',\n",
" '_maybe_update_cacher',\n",
" '_metadata',\n",
" '_needs_reindex_multi',\n",
" '_protect_consolidate',\n",
" '_reduce',\n",
" '_reindex_axes',\n",
" '_reindex_axis',\n",
" '_reindex_columns',\n",
" '_reindex_index',\n",
" '_reindex_multi',\n",
" '_reindex_with_indexers',\n",
" '_repr_fits_horizontal_',\n",
" '_repr_fits_vertical_',\n",
" '_repr_html_',\n",
" '_reset_cache',\n",
" '_sanitize_column',\n",
" '_series',\n",
" '_set_as_cached',\n",
" '_set_axis',\n",
" '_set_is_copy',\n",
" '_set_item',\n",
" '_setitem_array',\n",
" '_setitem_frame',\n",
" '_setitem_slice',\n",
" '_setup_axes',\n",
" '_slice',\n",
" '_stat_axis',\n",
" '_stat_axis_name',\n",
" '_stat_axis_number',\n",
" '_typ',\n",
" '_unpickle_frame_compat',\n",
" '_unpickle_matrix_compat',\n",
" '_update_inplace',\n",
" '_validate_dtype',\n",
" '_xs',\n",
" 'abs',\n",
" 'add',\n",
" 'add_prefix',\n",
" 'add_suffix',\n",
" 'age',\n",
" 'align',\n",
" 'all',\n",
" 'any',\n",
" 'append',\n",
" 'apply',\n",
" 'applymap',\n",
" 'as_blocks',\n",
" 'as_matrix',\n",
" 'asfreq',\n",
" 'assign',\n",
" 'astype',\n",
" 'at',\n",
" 'at_time',\n",
" 'axes',\n",
" 'between_time',\n",
" 'bfill',\n",
" 'black',\n",
" 'blocks',\n",
" 'bool',\n",
" 'boxplot',\n",
" 'chas',\n",
" 'clip',\n",
" 'clip_lower',\n",
" 'clip_upper',\n",
" 'columns',\n",
" 'combine',\n",
" 'combineAdd',\n",
" 'combineMult',\n",
" 'combine_first',\n",
" 'compound',\n",
" 'consolidate',\n",
" 'convert_objects',\n",
" 'copy',\n",
" 'corr',\n",
" 'corrwith',\n",
" 'count',\n",
" 'cov',\n",
" 'crim',\n",
" 'cummax',\n",
" 'cummin',\n",
" 'cumprod',\n",
" 'cumsum',\n",
" 'describe',\n",
" 'diff',\n",
" 'dis',\n",
" 'div',\n",
" 'divide',\n",
" 'dot',\n",
" 'drop',\n",
" 'drop_duplicates',\n",
" 'dropna',\n",
" 'dtypes',\n",
" 'duplicated',\n",
" 'empty',\n",
" 'eq',\n",
" 'equals',\n",
" 'eval',\n",
" 'ffill',\n",
" 'fillna',\n",
" 'filter',\n",
" 'first',\n",
" 'first_valid_index',\n",
" 'floordiv',\n",
" 'from_csv',\n",
" 'from_dict',\n",
" 'from_items',\n",
" 'from_records',\n",
" 'ftypes',\n",
" 'ge',\n",
" 'get',\n",
" 'get_dtype_counts',\n",
" 'get_ftype_counts',\n",
" 'get_value',\n",
" 'get_values',\n",
" 'groupby',\n",
" 'gt',\n",
" 'head',\n",
" 'hist',\n",
" 'iat',\n",
" 'icol',\n",
" 'idxmax',\n",
" 'idxmin',\n",
" 'iget_value',\n",
" 'iloc',\n",
" 'index',\n",
" 'indus',\n",
" 'info',\n",
" 'insert',\n",
" 'interpolate',\n",
" 'irow',\n",
" 'is_copy',\n",
" 'isin',\n",
" 'isnull',\n",
" 'items',\n",
" 'iteritems',\n",
" 'iterkv',\n",
" 'iterrows',\n",
" 'itertuples',\n",
" 'ix',\n",
" 'join',\n",
" 'keys',\n",
" 'kurt',\n",
" 'kurtosis',\n",
" 'last',\n",
" 'last_valid_index',\n",
" 'le',\n",
" 'load',\n",
" 'loc',\n",
" 'lookup',\n",
" 'lstat',\n",
" 'lt',\n",
" 'mad',\n",
" 'mask',\n",
" 'max',\n",
" 'mean',\n",
" 'median',\n",
" 'medv',\n",
" 'memory_usage',\n",
" 'merge',\n",
" 'min',\n",
" 'mod',\n",
" 'mode',\n",
" 'mul',\n",
" 'multiply',\n",
" 'ndim',\n",
" 'ne',\n",
" 'notnull',\n",
" 'nox',\n",
" 'pct_change',\n",
" 'pipe',\n",
" 'pivot',\n",
" 'pivot_table',\n",
" 'plot',\n",
" 'pop',\n",
" 'pow',\n",
" 'prod',\n",
" 'product',\n",
" 'ptratio',\n",
" 'quantile',\n",
" 'query',\n",
" 'rad',\n",
" 'radd',\n",
" 'rank',\n",
" 'rdiv',\n",
" 'reindex',\n",
" 'reindex_axis',\n",
" 'reindex_like',\n",
" 'rename',\n",
" 'rename_axis',\n",
" 'reorder_levels',\n",
" 'replace',\n",
" 'resample',\n",
" 'reset_index',\n",
" 'rfloordiv',\n",
" 'rm',\n",
" 'rmod',\n",
" 'rmul',\n",
" 'rpow',\n",
" 'rsub',\n",
" 'rtruediv',\n",
" 'sample',\n",
" 'save',\n",
" 'select',\n",
" 'select_dtypes',\n",
" 'sem',\n",
" 'set_axis',\n",
" 'set_index',\n",
" 'set_value',\n",
" 'shape',\n",
" 'shift',\n",
" 'size',\n",
" 'skew',\n",
" 'slice_shift',\n",
" 'sort',\n",
" 'sort_index',\n",
" 'sortlevel',\n",
" 'squeeze',\n",
" 'stack',\n",
" 'std',\n",
" 'sub',\n",
" 'subtract',\n",
" 'sum',\n",
" 'swapaxes',\n",
" 'swaplevel',\n",
" 'tail',\n",
" 'take',\n",
" 'tax',\n",
" 'to_clipboard',\n",
" 'to_csv',\n",
" 'to_dense',\n",
" 'to_dict',\n",
" 'to_excel',\n",
" 'to_gbq',\n",
" 'to_hdf',\n",
" 'to_html',\n",
" 'to_json',\n",
" 'to_latex',\n",
" 'to_msgpack',\n",
" 'to_panel',\n",
" 'to_period',\n",
" 'to_pickle',\n",
" 'to_records',\n",
" 'to_sparse',\n",
" 'to_sql',\n",
" 'to_stata',\n",
" 'to_string',\n",
" 'to_timestamp',\n",
" 'to_wide',\n",
" 'transpose',\n",
" 'truediv',\n",
" 'truncate',\n",
" 'tshift',\n",
" 'tz_convert',\n",
" 'tz_localize',\n",
" 'unstack',\n",
" 'update',\n",
" 'values',\n",
" 'var',\n",
" 'where',\n",
" 'xs',\n",
" 'zn']"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dir(Boston) #What are the various commands we can run on Boston"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>crim</th>\n",
" <th>zn</th>\n",
" <th>indus</th>\n",
" <th>chas</th>\n",
" <th>nox</th>\n",
" <th>rm</th>\n",
" <th>age</th>\n",
" <th>dis</th>\n",
" <th>rad</th>\n",
" <th>tax</th>\n",
" <th>ptratio</th>\n",
" <th>black</th>\n",
" <th>lstat</th>\n",
" <th>medv</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>0.00632</td>\n",
" <td>18</td>\n",
" <td>2.31</td>\n",
" <td>0</td>\n",
" <td>0.538</td>\n",
" <td>6.575</td>\n",
" <td>65.2</td>\n",
" <td>4.0900</td>\n",
" <td>1</td>\n",
" <td>296</td>\n",
" <td>15.3</td>\n",
" <td>396.90</td>\n",
" <td>4.98</td>\n",
" <td>24.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>0.02731</td>\n",
" <td>0</td>\n",
" <td>7.07</td>\n",
" <td>0</td>\n",
" <td>0.469</td>\n",
" <td>6.421</td>\n",
" <td>78.9</td>\n",
" <td>4.9671</td>\n",
" <td>2</td>\n",
" <td>242</td>\n",
" <td>17.8</td>\n",
" <td>396.90</td>\n",
" <td>9.14</td>\n",
" <td>21.6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>0.02729</td>\n",
" <td>0</td>\n",
" <td>7.07</td>\n",
" <td>0</td>\n",
" <td>0.469</td>\n",
" <td>7.185</td>\n",
" <td>61.1</td>\n",
" <td>4.9671</td>\n",
" <td>2</td>\n",
" <td>242</td>\n",
" <td>17.8</td>\n",
" <td>392.83</td>\n",
" <td>4.03</td>\n",
" <td>34.7</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" crim zn indus chas nox rm age dis rad tax ptratio \\\n",
"0 0.00632 18 2.31 0 0.538 6.575 65.2 4.0900 1 296 15.3 \n",
"1 0.02731 0 7.07 0 0.469 6.421 78.9 4.9671 2 242 17.8 \n",
"2 0.02729 0 7.07 0 0.469 7.185 61.1 4.9671 2 242 17.8 \n",
"\n",
" black lstat medv \n",
"0 396.90 4.98 24.0 \n",
"1 396.90 9.14 21.6 \n",
"2 392.83 4.03 34.7 "
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston[0:3] #Gives rows from first row to third row. In python index starts from 0 while in R it starts from 1."
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>crim</th>\n",
" <th>zn</th>\n",
" <th>indus</th>\n",
" <th>chas</th>\n",
" <th>nox</th>\n",
" <th>rm</th>\n",
" <th>age</th>\n",
" <th>dis</th>\n",
" <th>rad</th>\n",
" <th>tax</th>\n",
" <th>ptratio</th>\n",
" <th>black</th>\n",
" <th>lstat</th>\n",
" <th>medv</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>501</th>\n",
" <td>0.06263</td>\n",
" <td>0</td>\n",
" <td>11.93</td>\n",
" <td>0</td>\n",
" <td>0.573</td>\n",
" <td>6.593</td>\n",
" <td>69.1</td>\n",
" <td>2.4786</td>\n",
" <td>1</td>\n",
" <td>273</td>\n",
" <td>21</td>\n",
" <td>391.99</td>\n",
" <td>9.67</td>\n",
" <td>22.4</td>\n",
" </tr>\n",
" <tr>\n",
" <th>502</th>\n",
" <td>0.04527</td>\n",
" <td>0</td>\n",
" <td>11.93</td>\n",
" <td>0</td>\n",
" <td>0.573</td>\n",
" <td>6.120</td>\n",
" <td>76.7</td>\n",
" <td>2.2875</td>\n",
" <td>1</td>\n",
" <td>273</td>\n",
" <td>21</td>\n",
" <td>396.90</td>\n",
" <td>9.08</td>\n",
" <td>20.6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>503</th>\n",
" <td>0.06076</td>\n",
" <td>0</td>\n",
" <td>11.93</td>\n",
" <td>0</td>\n",
" <td>0.573</td>\n",
" <td>6.976</td>\n",
" <td>91.0</td>\n",
" <td>2.1675</td>\n",
" <td>1</td>\n",
" <td>273</td>\n",
" <td>21</td>\n",
" <td>396.90</td>\n",
" <td>5.64</td>\n",
" <td>23.9</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" crim zn indus chas nox rm age dis rad tax ptratio \\\n",
"501 0.06263 0 11.93 0 0.573 6.593 69.1 2.4786 1 273 21 \n",
"502 0.04527 0 11.93 0 0.573 6.120 76.7 2.2875 1 273 21 \n",
"503 0.06076 0 11.93 0 0.573 6.976 91.0 2.1675 1 273 21 \n",
"\n",
" black lstat medv \n",
"501 391.99 9.67 22.4 \n",
"502 396.90 9.08 20.6 \n",
"503 396.90 5.64 23.9 "
]
},
"execution_count": 21,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston[-5:504] #Gives rows from 506(total rows)-5 to the row number specified. \n",
"#Note index is one less than row number unlike R"
]
},
{
"cell_type": "code",
"execution_count": 25,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>medv</th>\n",
" <th>rm</th>\n",
" <th>chas</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>24.0</td>\n",
" <td>6.575</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>21.6</td>\n",
" <td>6.421</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>34.7</td>\n",
" <td>7.185</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>33.4</td>\n",
" <td>6.998</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>36.2</td>\n",
" <td>7.147</td>\n",
" <td>0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" medv rm chas\n",
"0 24.0 6.575 0\n",
"1 21.6 6.421 0\n",
"2 34.7 7.185 0\n",
"3 33.4 6.998 0\n",
"4 36.2 7.147 0"
]
},
"execution_count": 25,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston[['medv','rm','chas']].head() #Note the double square brackets [[]]"
]
},
{
"cell_type": "code",
"execution_count": 28,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>medv</th>\n",
" <th>rm</th>\n",
" <th>chas</th>\n",
" <th>nox</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>33.4</td>\n",
" <td>6.998</td>\n",
" <td>0</td>\n",
" <td>0.458</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>36.2</td>\n",
" <td>7.147</td>\n",
" <td>0</td>\n",
" <td>0.458</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>28.7</td>\n",
" <td>6.430</td>\n",
" <td>0</td>\n",
" <td>0.458</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>22.9</td>\n",
" <td>6.012</td>\n",
" <td>0</td>\n",
" <td>0.524</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7</th>\n",
" <td>27.1</td>\n",
" <td>6.172</td>\n",
" <td>0</td>\n",
" <td>0.524</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8</th>\n",
" <td>16.5</td>\n",
" <td>5.631</td>\n",
" <td>0</td>\n",
" <td>0.524</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9</th>\n",
" <td>18.9</td>\n",
" <td>6.004</td>\n",
" <td>0</td>\n",
" <td>0.524</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10</th>\n",
" <td>15.0</td>\n",
" <td>6.377</td>\n",
" <td>0</td>\n",
" <td>0.524</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" medv rm chas nox\n",
"3 33.4 6.998 0 0.458\n",
"4 36.2 7.147 0 0.458\n",
"5 28.7 6.430 0 0.458\n",
"6 22.9 6.012 0 0.524\n",
"7 27.1 6.172 0 0.524\n",
"8 16.5 5.631 0 0.524\n",
"9 18.9 6.004 0 0.524\n",
"10 15.0 6.377 0 0.524"
]
},
"execution_count": 28,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston.ix[3:10,['medv','rm','chas','nox']] \n",
"#Note the use of command ix as well as putting row numbers and column names seperately"
]
},
{
"cell_type": "code",
"execution_count": 39,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/plain": [
"0 False\n",
"1 False\n",
"2 False\n",
"3 False\n",
"4 False\n",
"5 False\n",
"6 False\n",
"7 False\n",
"8 False\n",
"9 False\n",
"10 False\n",
"11 False\n",
"12 False\n",
"13 False\n",
"14 False\n",
"15 False\n",
"16 False\n",
"17 False\n",
"18 False\n",
"19 False\n",
"20 False\n",
"21 False\n",
"22 False\n",
"23 False\n",
"24 False\n",
"25 False\n",
"26 False\n",
"27 False\n",
"28 False\n",
"29 False\n",
" ... \n",
"476 False\n",
"477 False\n",
"478 False\n",
"479 False\n",
"480 False\n",
"481 False\n",
"482 False\n",
"483 False\n",
"484 False\n",
"485 False\n",
"486 False\n",
"487 False\n",
"488 False\n",
"489 False\n",
"490 False\n",
"491 False\n",
"492 False\n",
"493 False\n",
"494 False\n",
"495 False\n",
"496 False\n",
"497 False\n",
"498 False\n",
"499 False\n",
"500 False\n",
"501 False\n",
"502 False\n",
"503 False\n",
"504 False\n",
"505 False\n",
"Name: medv, dtype: bool"
]
},
"execution_count": 39,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston['medv']>49"
]
},
{
"cell_type": "code",
"execution_count": 38,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>crim</th>\n",
" <th>zn</th>\n",
" <th>indus</th>\n",
" <th>chas</th>\n",
" <th>nox</th>\n",
" <th>rm</th>\n",
" <th>age</th>\n",
" <th>dis</th>\n",
" <th>rad</th>\n",
" <th>tax</th>\n",
" <th>ptratio</th>\n",
" <th>black</th>\n",
" <th>lstat</th>\n",
" <th>medv</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>161</th>\n",
" <td>1.46336</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>0</td>\n",
" <td>0.6050</td>\n",
" <td>7.489</td>\n",
" <td>90.8</td>\n",
" <td>1.9709</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>374.43</td>\n",
" <td>1.73</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>162</th>\n",
" <td>1.83377</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>1</td>\n",
" <td>0.6050</td>\n",
" <td>7.802</td>\n",
" <td>98.2</td>\n",
" <td>2.0407</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>389.61</td>\n",
" <td>1.92</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>163</th>\n",
" <td>1.51902</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>1</td>\n",
" <td>0.6050</td>\n",
" <td>8.375</td>\n",
" <td>93.9</td>\n",
" <td>2.1620</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>388.45</td>\n",
" <td>3.32</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>166</th>\n",
" <td>2.01019</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>0</td>\n",
" <td>0.6050</td>\n",
" <td>7.929</td>\n",
" <td>96.2</td>\n",
" <td>2.0459</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>369.30</td>\n",
" <td>3.70</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>186</th>\n",
" <td>0.05602</td>\n",
" <td>0</td>\n",
" <td>2.46</td>\n",
" <td>0</td>\n",
" <td>0.4880</td>\n",
" <td>7.831</td>\n",
" <td>53.6</td>\n",
" <td>3.1992</td>\n",
" <td>3</td>\n",
" <td>193</td>\n",
" <td>17.8</td>\n",
" <td>392.63</td>\n",
" <td>4.45</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>195</th>\n",
" <td>0.01381</td>\n",
" <td>80</td>\n",
" <td>0.46</td>\n",
" <td>0</td>\n",
" <td>0.4220</td>\n",
" <td>7.875</td>\n",
" <td>32.0</td>\n",
" <td>5.6484</td>\n",
" <td>4</td>\n",
" <td>255</td>\n",
" <td>14.4</td>\n",
" <td>394.23</td>\n",
" <td>2.97</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>204</th>\n",
" <td>0.02009</td>\n",
" <td>95</td>\n",
" <td>2.68</td>\n",
" <td>0</td>\n",
" <td>0.4161</td>\n",
" <td>8.034</td>\n",
" <td>31.9</td>\n",
" <td>5.1180</td>\n",
" <td>4</td>\n",
" <td>224</td>\n",
" <td>14.7</td>\n",
" <td>390.55</td>\n",
" <td>2.88</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>225</th>\n",
" <td>0.52693</td>\n",
" <td>0</td>\n",
" <td>6.20</td>\n",
" <td>0</td>\n",
" <td>0.5040</td>\n",
" <td>8.725</td>\n",
" <td>83.0</td>\n",
" <td>2.8944</td>\n",
" <td>8</td>\n",
" <td>307</td>\n",
" <td>17.4</td>\n",
" <td>382.00</td>\n",
" <td>4.63</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>257</th>\n",
" <td>0.61154</td>\n",
" <td>20</td>\n",
" <td>3.97</td>\n",
" <td>0</td>\n",
" <td>0.6470</td>\n",
" <td>8.704</td>\n",
" <td>86.9</td>\n",
" <td>1.8010</td>\n",
" <td>5</td>\n",
" <td>264</td>\n",
" <td>13.0</td>\n",
" <td>389.70</td>\n",
" <td>5.12</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>267</th>\n",
" <td>0.57834</td>\n",
" <td>20</td>\n",
" <td>3.97</td>\n",
" <td>0</td>\n",
" <td>0.5750</td>\n",
" <td>8.297</td>\n",
" <td>67.0</td>\n",
" <td>2.4216</td>\n",
" <td>5</td>\n",
" <td>264</td>\n",
" <td>13.0</td>\n",
" <td>384.54</td>\n",
" <td>7.44</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>283</th>\n",
" <td>0.01501</td>\n",
" <td>90</td>\n",
" <td>1.21</td>\n",
" <td>1</td>\n",
" <td>0.4010</td>\n",
" <td>7.923</td>\n",
" <td>24.8</td>\n",
" <td>5.8850</td>\n",
" <td>1</td>\n",
" <td>198</td>\n",
" <td>13.6</td>\n",
" <td>395.52</td>\n",
" <td>3.16</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>368</th>\n",
" <td>4.89822</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>0</td>\n",
" <td>0.6310</td>\n",
" <td>4.970</td>\n",
" <td>100.0</td>\n",
" <td>1.3325</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>375.52</td>\n",
" <td>3.26</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>369</th>\n",
" <td>5.66998</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>1</td>\n",
" <td>0.6310</td>\n",
" <td>6.683</td>\n",
" <td>96.8</td>\n",
" <td>1.3567</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>375.33</td>\n",
" <td>3.73</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>370</th>\n",
" <td>6.53876</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>1</td>\n",
" <td>0.6310</td>\n",
" <td>7.016</td>\n",
" <td>97.5</td>\n",
" <td>1.2024</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>392.05</td>\n",
" <td>2.96</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>371</th>\n",
" <td>9.23230</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>0</td>\n",
" <td>0.6310</td>\n",
" <td>6.216</td>\n",
" <td>100.0</td>\n",
" <td>1.1691</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>366.15</td>\n",
" <td>9.53</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>372</th>\n",
" <td>8.26725</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>1</td>\n",
" <td>0.6680</td>\n",
" <td>5.875</td>\n",
" <td>89.6</td>\n",
" <td>1.1296</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>347.88</td>\n",
" <td>8.88</td>\n",
" <td>50</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" crim zn indus chas nox rm age dis rad tax \\\n",
"161 1.46336 0 19.58 0 0.6050 7.489 90.8 1.9709 5 403 \n",
"162 1.83377 0 19.58 1 0.6050 7.802 98.2 2.0407 5 403 \n",
"163 1.51902 0 19.58 1 0.6050 8.375 93.9 2.1620 5 403 \n",
"166 2.01019 0 19.58 0 0.6050 7.929 96.2 2.0459 5 403 \n",
"186 0.05602 0 2.46 0 0.4880 7.831 53.6 3.1992 3 193 \n",
"195 0.01381 80 0.46 0 0.4220 7.875 32.0 5.6484 4 255 \n",
"204 0.02009 95 2.68 0 0.4161 8.034 31.9 5.1180 4 224 \n",
"225 0.52693 0 6.20 0 0.5040 8.725 83.0 2.8944 8 307 \n",
"257 0.61154 20 3.97 0 0.6470 8.704 86.9 1.8010 5 264 \n",
"267 0.57834 20 3.97 0 0.5750 8.297 67.0 2.4216 5 264 \n",
"283 0.01501 90 1.21 1 0.4010 7.923 24.8 5.8850 1 198 \n",
"368 4.89822 0 18.10 0 0.6310 4.970 100.0 1.3325 24 666 \n",
"369 5.66998 0 18.10 1 0.6310 6.683 96.8 1.3567 24 666 \n",
"370 6.53876 0 18.10 1 0.6310 7.016 97.5 1.2024 24 666 \n",
"371 9.23230 0 18.10 0 0.6310 6.216 100.0 1.1691 24 666 \n",
"372 8.26725 0 18.10 1 0.6680 5.875 89.6 1.1296 24 666 \n",
"\n",
" ptratio black lstat medv \n",
"161 14.7 374.43 1.73 50 \n",
"162 14.7 389.61 1.92 50 \n",
"163 14.7 388.45 3.32 50 \n",
"166 14.7 369.30 3.70 50 \n",
"186 17.8 392.63 4.45 50 \n",
"195 14.4 394.23 2.97 50 \n",
"204 14.7 390.55 2.88 50 \n",
"225 17.4 382.00 4.63 50 \n",
"257 13.0 389.70 5.12 50 \n",
"267 13.0 384.54 7.44 50 \n",
"283 13.6 395.52 3.16 50 \n",
"368 20.2 375.52 3.26 50 \n",
"369 20.2 375.33 3.73 50 \n",
"370 20.2 392.05 2.96 50 \n",
"371 20.2 366.15 9.53 50 \n",
"372 20.2 347.88 8.88 50 "
]
},
"execution_count": 38,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston[Boston['medv']>49]"
]
},
{
"cell_type": "code",
"execution_count": 47,
"metadata": {
"collapsed": false
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/ajay/anaconda3/lib/python3.4/site-packages/pandas/core/frame.py:1825: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" \"DataFrame index.\", UserWarning)\n"
]
},
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>crim</th>\n",
" <th>zn</th>\n",
" <th>indus</th>\n",
" <th>chas</th>\n",
" <th>nox</th>\n",
" <th>rm</th>\n",
" <th>age</th>\n",
" <th>dis</th>\n",
" <th>rad</th>\n",
" <th>tax</th>\n",
" <th>ptratio</th>\n",
" <th>black</th>\n",
" <th>lstat</th>\n",
" <th>medv</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>161</th>\n",
" <td>1.46336</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>0</td>\n",
" <td>0.6050</td>\n",
" <td>7.489</td>\n",
" <td>90.8</td>\n",
" <td>1.9709</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>374.43</td>\n",
" <td>1.73</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>166</th>\n",
" <td>2.01019</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>0</td>\n",
" <td>0.6050</td>\n",
" <td>7.929</td>\n",
" <td>96.2</td>\n",
" <td>2.0459</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>369.30</td>\n",
" <td>3.70</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>186</th>\n",
" <td>0.05602</td>\n",
" <td>0</td>\n",
" <td>2.46</td>\n",
" <td>0</td>\n",
" <td>0.4880</td>\n",
" <td>7.831</td>\n",
" <td>53.6</td>\n",
" <td>3.1992</td>\n",
" <td>3</td>\n",
" <td>193</td>\n",
" <td>17.8</td>\n",
" <td>392.63</td>\n",
" <td>4.45</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>195</th>\n",
" <td>0.01381</td>\n",
" <td>80</td>\n",
" <td>0.46</td>\n",
" <td>0</td>\n",
" <td>0.4220</td>\n",
" <td>7.875</td>\n",
" <td>32.0</td>\n",
" <td>5.6484</td>\n",
" <td>4</td>\n",
" <td>255</td>\n",
" <td>14.4</td>\n",
" <td>394.23</td>\n",
" <td>2.97</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>204</th>\n",
" <td>0.02009</td>\n",
" <td>95</td>\n",
" <td>2.68</td>\n",
" <td>0</td>\n",
" <td>0.4161</td>\n",
" <td>8.034</td>\n",
" <td>31.9</td>\n",
" <td>5.1180</td>\n",
" <td>4</td>\n",
" <td>224</td>\n",
" <td>14.7</td>\n",
" <td>390.55</td>\n",
" <td>2.88</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>225</th>\n",
" <td>0.52693</td>\n",
" <td>0</td>\n",
" <td>6.20</td>\n",
" <td>0</td>\n",
" <td>0.5040</td>\n",
" <td>8.725</td>\n",
" <td>83.0</td>\n",
" <td>2.8944</td>\n",
" <td>8</td>\n",
" <td>307</td>\n",
" <td>17.4</td>\n",
" <td>382.00</td>\n",
" <td>4.63</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>257</th>\n",
" <td>0.61154</td>\n",
" <td>20</td>\n",
" <td>3.97</td>\n",
" <td>0</td>\n",
" <td>0.6470</td>\n",
" <td>8.704</td>\n",
" <td>86.9</td>\n",
" <td>1.8010</td>\n",
" <td>5</td>\n",
" <td>264</td>\n",
" <td>13.0</td>\n",
" <td>389.70</td>\n",
" <td>5.12</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>267</th>\n",
" <td>0.57834</td>\n",
" <td>20</td>\n",
" <td>3.97</td>\n",
" <td>0</td>\n",
" <td>0.5750</td>\n",
" <td>8.297</td>\n",
" <td>67.0</td>\n",
" <td>2.4216</td>\n",
" <td>5</td>\n",
" <td>264</td>\n",
" <td>13.0</td>\n",
" <td>384.54</td>\n",
" <td>7.44</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>368</th>\n",
" <td>4.89822</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>0</td>\n",
" <td>0.6310</td>\n",
" <td>4.970</td>\n",
" <td>100.0</td>\n",
" <td>1.3325</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>375.52</td>\n",
" <td>3.26</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>371</th>\n",
" <td>9.23230</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>0</td>\n",
" <td>0.6310</td>\n",
" <td>6.216</td>\n",
" <td>100.0</td>\n",
" <td>1.1691</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>366.15</td>\n",
" <td>9.53</td>\n",
" <td>50</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" crim zn indus chas nox rm age dis rad tax \\\n",
"161 1.46336 0 19.58 0 0.6050 7.489 90.8 1.9709 5 403 \n",
"166 2.01019 0 19.58 0 0.6050 7.929 96.2 2.0459 5 403 \n",
"186 0.05602 0 2.46 0 0.4880 7.831 53.6 3.1992 3 193 \n",
"195 0.01381 80 0.46 0 0.4220 7.875 32.0 5.6484 4 255 \n",
"204 0.02009 95 2.68 0 0.4161 8.034 31.9 5.1180 4 224 \n",
"225 0.52693 0 6.20 0 0.5040 8.725 83.0 2.8944 8 307 \n",
"257 0.61154 20 3.97 0 0.6470 8.704 86.9 1.8010 5 264 \n",
"267 0.57834 20 3.97 0 0.5750 8.297 67.0 2.4216 5 264 \n",
"368 4.89822 0 18.10 0 0.6310 4.970 100.0 1.3325 24 666 \n",
"371 9.23230 0 18.10 0 0.6310 6.216 100.0 1.1691 24 666 \n",
"\n",
" ptratio black lstat medv \n",
"161 14.7 374.43 1.73 50 \n",
"166 14.7 369.30 3.70 50 \n",
"186 17.8 392.63 4.45 50 \n",
"195 14.4 394.23 2.97 50 \n",
"204 14.7 390.55 2.88 50 \n",
"225 17.4 382.00 4.63 50 \n",
"257 13.0 389.70 5.12 50 \n",
"267 13.0 384.54 7.44 50 \n",
"368 20.2 375.52 3.26 50 \n",
"371 20.2 366.15 9.53 50 "
]
},
"execution_count": 47,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Combine both conditions into ONE boolean mask with `&` (each comparison must be\n",
"# parenthesised). Chaining [...][...] applies a full-length mask to an already\n",
"# filtered frame, which makes pandas reindex the mask and emit a UserWarning.\n",
"Boston[(Boston['medv'] > 49) & (Boston['chas'] == 0)]"
]
},
{
"cell_type": "code",
"execution_count": 48,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>crim</th>\n",
" <th>zn</th>\n",
" <th>indus</th>\n",
" <th>chas</th>\n",
" <th>nox</th>\n",
" <th>rm</th>\n",
" <th>age</th>\n",
" <th>dis</th>\n",
" <th>rad</th>\n",
" <th>tax</th>\n",
" <th>ptratio</th>\n",
" <th>black</th>\n",
" <th>lstat</th>\n",
" <th>medv</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>163</th>\n",
" <td>1.51902</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>1</td>\n",
" <td>0.6050</td>\n",
" <td>8.375</td>\n",
" <td>93.9</td>\n",
" <td>2.1620</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>388.45</td>\n",
" <td>3.32</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>204</th>\n",
" <td>0.02009</td>\n",
" <td>95</td>\n",
" <td>2.68</td>\n",
" <td>0</td>\n",
" <td>0.4161</td>\n",
" <td>8.034</td>\n",
" <td>31.9</td>\n",
" <td>5.1180</td>\n",
" <td>4</td>\n",
" <td>224</td>\n",
" <td>14.7</td>\n",
" <td>390.55</td>\n",
" <td>2.88</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>225</th>\n",
" <td>0.52693</td>\n",
" <td>0</td>\n",
" <td>6.20</td>\n",
" <td>0</td>\n",
" <td>0.5040</td>\n",
" <td>8.725</td>\n",
" <td>83.0</td>\n",
" <td>2.8944</td>\n",
" <td>8</td>\n",
" <td>307</td>\n",
" <td>17.4</td>\n",
" <td>382.00</td>\n",
" <td>4.63</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>257</th>\n",
" <td>0.61154</td>\n",
" <td>20</td>\n",
" <td>3.97</td>\n",
" <td>0</td>\n",
" <td>0.6470</td>\n",
" <td>8.704</td>\n",
" <td>86.9</td>\n",
" <td>1.8010</td>\n",
" <td>5</td>\n",
" <td>264</td>\n",
" <td>13.0</td>\n",
" <td>389.70</td>\n",
" <td>5.12</td>\n",
" <td>50</td>\n",
" </tr>\n",
" <tr>\n",
" <th>267</th>\n",
" <td>0.57834</td>\n",
" <td>20</td>\n",
" <td>3.97</td>\n",
" <td>0</td>\n",
" <td>0.5750</td>\n",
" <td>8.297</td>\n",
" <td>67.0</td>\n",
" <td>2.4216</td>\n",
" <td>5</td>\n",
" <td>264</td>\n",
" <td>13.0</td>\n",
" <td>384.54</td>\n",
" <td>7.44</td>\n",
" <td>50</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" crim zn indus chas nox rm age dis rad tax ptratio \\\n",
"163 1.51902 0 19.58 1 0.6050 8.375 93.9 2.1620 5 403 14.7 \n",
"204 0.02009 95 2.68 0 0.4161 8.034 31.9 5.1180 4 224 14.7 \n",
"225 0.52693 0 6.20 0 0.5040 8.725 83.0 2.8944 8 307 17.4 \n",
"257 0.61154 20 3.97 0 0.6470 8.704 86.9 1.8010 5 264 13.0 \n",
"267 0.57834 20 3.97 0 0.5750 8.297 67.0 2.4216 5 264 13.0 \n",
"\n",
" black lstat medv \n",
"163 388.45 3.32 50 \n",
"204 390.55 2.88 50 \n",
"225 382.00 4.63 50 \n",
"257 389.70 5.12 50 \n",
"267 384.54 7.44 50 "
]
},
"execution_count": 48,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston.query('medv >49 and rm >8')"
]
},
{
"cell_type": "code",
"execution_count": 52,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>crim</th>\n",
" <th>zn</th>\n",
" <th>indus</th>\n",
" <th>chas</th>\n",
" <th>nox</th>\n",
" <th>rm</th>\n",
" <th>age</th>\n",
" <th>dis</th>\n",
" <th>rad</th>\n",
" <th>tax</th>\n",
" <th>ptratio</th>\n",
" <th>black</th>\n",
" <th>lstat</th>\n",
" <th>medv</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>161</th>\n",
" <td>1.46336</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>0</td>\n",
" <td>0.6050</td>\n",
" <td>7.489</td>\n",
" <td>90.8</td>\n",
" <td>1.9709</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>374.43</td>\n",
" <td>1.73</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>162</th>\n",
" <td>1.83377</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>1</td>\n",
" <td>0.6050</td>\n",
" <td>7.802</td>\n",
" <td>98.2</td>\n",
" <td>2.0407</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>389.61</td>\n",
" <td>1.92</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>163</th>\n",
" <td>1.51902</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>1</td>\n",
" <td>0.6050</td>\n",
" <td>8.375</td>\n",
" <td>93.9</td>\n",
" <td>2.1620</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>388.45</td>\n",
" <td>3.32</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>166</th>\n",
" <td>2.01019</td>\n",
" <td>0</td>\n",
" <td>19.58</td>\n",
" <td>0</td>\n",
" <td>0.6050</td>\n",
" <td>7.929</td>\n",
" <td>96.2</td>\n",
" <td>2.0459</td>\n",
" <td>5</td>\n",
" <td>403</td>\n",
" <td>14.7</td>\n",
" <td>369.30</td>\n",
" <td>3.70</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>186</th>\n",
" <td>0.05602</td>\n",
" <td>0</td>\n",
" <td>2.46</td>\n",
" <td>0</td>\n",
" <td>0.4880</td>\n",
" <td>7.831</td>\n",
" <td>53.6</td>\n",
" <td>3.1992</td>\n",
" <td>3</td>\n",
" <td>193</td>\n",
" <td>17.8</td>\n",
" <td>392.63</td>\n",
" <td>4.45</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>195</th>\n",
" <td>0.01381</td>\n",
" <td>80</td>\n",
" <td>0.46</td>\n",
" <td>0</td>\n",
" <td>0.4220</td>\n",
" <td>7.875</td>\n",
" <td>32.0</td>\n",
" <td>5.6484</td>\n",
" <td>4</td>\n",
" <td>255</td>\n",
" <td>14.4</td>\n",
" <td>394.23</td>\n",
" <td>2.97</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>204</th>\n",
" <td>0.02009</td>\n",
" <td>95</td>\n",
" <td>2.68</td>\n",
" <td>0</td>\n",
" <td>0.4161</td>\n",
" <td>8.034</td>\n",
" <td>31.9</td>\n",
" <td>5.1180</td>\n",
" <td>4</td>\n",
" <td>224</td>\n",
" <td>14.7</td>\n",
" <td>390.55</td>\n",
" <td>2.88</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>225</th>\n",
" <td>0.52693</td>\n",
" <td>0</td>\n",
" <td>6.20</td>\n",
" <td>0</td>\n",
" <td>0.5040</td>\n",
" <td>8.725</td>\n",
" <td>83.0</td>\n",
" <td>2.8944</td>\n",
" <td>8</td>\n",
" <td>307</td>\n",
" <td>17.4</td>\n",
" <td>382.00</td>\n",
" <td>4.63</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>257</th>\n",
" <td>0.61154</td>\n",
" <td>20</td>\n",
" <td>3.97</td>\n",
" <td>0</td>\n",
" <td>0.6470</td>\n",
" <td>8.704</td>\n",
" <td>86.9</td>\n",
" <td>1.8010</td>\n",
" <td>5</td>\n",
" <td>264</td>\n",
" <td>13.0</td>\n",
" <td>389.70</td>\n",
" <td>5.12</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>267</th>\n",
" <td>0.57834</td>\n",
" <td>20</td>\n",
" <td>3.97</td>\n",
" <td>0</td>\n",
" <td>0.5750</td>\n",
" <td>8.297</td>\n",
" <td>67.0</td>\n",
" <td>2.4216</td>\n",
" <td>5</td>\n",
" <td>264</td>\n",
" <td>13.0</td>\n",
" <td>384.54</td>\n",
" <td>7.44</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>283</th>\n",
" <td>0.01501</td>\n",
" <td>90</td>\n",
" <td>1.21</td>\n",
" <td>1</td>\n",
" <td>0.4010</td>\n",
" <td>7.923</td>\n",
" <td>24.8</td>\n",
" <td>5.8850</td>\n",
" <td>1</td>\n",
" <td>198</td>\n",
" <td>13.6</td>\n",
" <td>395.52</td>\n",
" <td>3.16</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>365</th>\n",
" <td>4.55587</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>0</td>\n",
" <td>0.7180</td>\n",
" <td>3.561</td>\n",
" <td>87.9</td>\n",
" <td>1.6132</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>354.70</td>\n",
" <td>7.12</td>\n",
" <td>27.5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>367</th>\n",
" <td>13.52220</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>0</td>\n",
" <td>0.6310</td>\n",
" <td>3.863</td>\n",
" <td>100.0</td>\n",
" <td>1.5106</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>131.42</td>\n",
" <td>13.33</td>\n",
" <td>23.1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>368</th>\n",
" <td>4.89822</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>0</td>\n",
" <td>0.6310</td>\n",
" <td>4.970</td>\n",
" <td>100.0</td>\n",
" <td>1.3325</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>375.52</td>\n",
" <td>3.26</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>369</th>\n",
" <td>5.66998</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>1</td>\n",
" <td>0.6310</td>\n",
" <td>6.683</td>\n",
" <td>96.8</td>\n",
" <td>1.3567</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>375.33</td>\n",
" <td>3.73</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>370</th>\n",
" <td>6.53876</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>1</td>\n",
" <td>0.6310</td>\n",
" <td>7.016</td>\n",
" <td>97.5</td>\n",
" <td>1.2024</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>392.05</td>\n",
" <td>2.96</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>371</th>\n",
" <td>9.23230</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>0</td>\n",
" <td>0.6310</td>\n",
" <td>6.216</td>\n",
" <td>100.0</td>\n",
" <td>1.1691</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>366.15</td>\n",
" <td>9.53</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>372</th>\n",
" <td>8.26725</td>\n",
" <td>0</td>\n",
" <td>18.10</td>\n",
" <td>1</td>\n",
" <td>0.6680</td>\n",
" <td>5.875</td>\n",
" <td>89.6</td>\n",
" <td>1.1296</td>\n",
" <td>24</td>\n",
" <td>666</td>\n",
" <td>20.2</td>\n",
" <td>347.88</td>\n",
" <td>8.88</td>\n",
" <td>50.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" crim zn indus chas nox rm age dis rad tax \\\n",
"161 1.46336 0 19.58 0 0.6050 7.489 90.8 1.9709 5 403 \n",
"162 1.83377 0 19.58 1 0.6050 7.802 98.2 2.0407 5 403 \n",
"163 1.51902 0 19.58 1 0.6050 8.375 93.9 2.1620 5 403 \n",
"166 2.01019 0 19.58 0 0.6050 7.929 96.2 2.0459 5 403 \n",
"186 0.05602 0 2.46 0 0.4880 7.831 53.6 3.1992 3 193 \n",
"195 0.01381 80 0.46 0 0.4220 7.875 32.0 5.6484 4 255 \n",
"204 0.02009 95 2.68 0 0.4161 8.034 31.9 5.1180 4 224 \n",
"225 0.52693 0 6.20 0 0.5040 8.725 83.0 2.8944 8 307 \n",
"257 0.61154 20 3.97 0 0.6470 8.704 86.9 1.8010 5 264 \n",
"267 0.57834 20 3.97 0 0.5750 8.297 67.0 2.4216 5 264 \n",
"283 0.01501 90 1.21 1 0.4010 7.923 24.8 5.8850 1 198 \n",
"365 4.55587 0 18.10 0 0.7180 3.561 87.9 1.6132 24 666 \n",
"367 13.52220 0 18.10 0 0.6310 3.863 100.0 1.5106 24 666 \n",
"368 4.89822 0 18.10 0 0.6310 4.970 100.0 1.3325 24 666 \n",
"369 5.66998 0 18.10 1 0.6310 6.683 96.8 1.3567 24 666 \n",
"370 6.53876 0 18.10 1 0.6310 7.016 97.5 1.2024 24 666 \n",
"371 9.23230 0 18.10 0 0.6310 6.216 100.0 1.1691 24 666 \n",
"372 8.26725 0 18.10 1 0.6680 5.875 89.6 1.1296 24 666 \n",
"\n",
" ptratio black lstat medv \n",
"161 14.7 374.43 1.73 50.0 \n",
"162 14.7 389.61 1.92 50.0 \n",
"163 14.7 388.45 3.32 50.0 \n",
"166 14.7 369.30 3.70 50.0 \n",
"186 17.8 392.63 4.45 50.0 \n",
"195 14.4 394.23 2.97 50.0 \n",
"204 14.7 390.55 2.88 50.0 \n",
"225 17.4 382.00 4.63 50.0 \n",
"257 13.0 389.70 5.12 50.0 \n",
"267 13.0 384.54 7.44 50.0 \n",
"283 13.6 395.52 3.16 50.0 \n",
"365 20.2 354.70 7.12 27.5 \n",
"367 20.2 131.42 13.33 23.1 \n",
"368 20.2 375.52 3.26 50.0 \n",
"369 20.2 375.33 3.73 50.0 \n",
"370 20.2 392.05 2.96 50.0 \n",
"371 20.2 366.15 9.53 50.0 \n",
"372 20.2 347.88 8.88 50.0 "
]
},
"execution_count": 52,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Boston.query('medv >49 or rm <4')"
]
},
{
"cell_type": "code",
"execution_count": 54,
"metadata": {
"collapsed": false
},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.4.3"
}
},
"nbformat": 4,
"nbformat_minor": 0
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment