Created
December 2, 2014 10:35
-
-
Save mattions/61c850bc134dc837ce7c to your computer and use it in GitHub Desktop.
Just an idea | nbviewer: http://nbviewer.ipython.org/gist/mattions/61c850bc134dc837ce7c
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"metadata": { | |
"name": "", | |
"signature": "sha256:5835de2e10cb99253cfa1841c86b02e6b9ee8b2fb21e513bbaec771e6e006c1b" | |
}, | |
"nbformat": 3, | |
"nbformat_minor": 0, | |
"worksheets": [ | |
{ | |
"cells": [ | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"# Just an idea" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [], | |
"prompt_number": 1 | |
}, | |
{ | |
"cell_type": "markdown", | |
"metadata": {}, | |
"source": [ | |
"# Original test.ldj\n", | |
"\n", | |
"Each line is a valid JSON object on its own, but the file as a whole is not a single valid JSON document\n", | |
"\n", | |
" {\"KEY3\": \"qux0\", \"KEY2\": \"baz0\", \"KEY1\": \"bar0\", \"KEY0\": \"foo0\", \"POS\": 5, \"CHROM\": \"chr3\"}\n", | |
" {\"KEY3\": \"qux1\", \"KEY2\": \"baz1\", \"KEY1\": \"bar1\", \"KEY0\": \"foo1\", \"POS\": 6, \"CHROM\": \"chr12\"}\n", | |
" {\"KEY3\": \"qux2\", \"KEY2\": \"baz2\", \"KEY1\": \"bar2\", \"KEY0\": \"foo2\", \"POS\": 9, \"CHROM\": \"chr1\"}\n", | |
" {\"KEY3\": \"qux3\", \"KEY2\": \"baz3\", \"KEY1\": \"bar3\", \"KEY0\": \"foo3\", \"POS\": 8, \"CHROM\": \"chr12\"}\n", | |
" {\"KEY3\": \"qux4\", \"KEY2\": \"baz4\", \"KEY1\": \"bar4\", \"KEY0\": \"foo4\", \"POS\": 3, \"CHROM\": \"chrX\"}\n", | |
" {\"KEY3\": \"qux5\", \"KEY2\": \"baz5\", \"KEY1\": \"bar5\", \"KEY0\": \"foo5\", \"POS\": 2, \"CHROM\": \"chrX\"}\n", | |
" {\"KEY3\": \"qux6\", \"KEY2\": \"baz6\", \"KEY1\": \"bar6\", \"KEY0\": \"foo6\", \"POS\": 10, \"CHROM\": \"chr3\"}\n", | |
" {\"KEY3\": \"qux7\", \"KEY2\": \"baz7\", \"KEY1\": \"bar7\", \"KEY0\": \"foo7\", \"POS\": 9, \"CHROM\": \"chr1\"}\n", | |
" {\"KEY3\": \"qux8\", \"KEY2\": \"baz8\", \"KEY1\": \"bar8\", \"KEY0\": \"foo8\", \"POS\": 0, \"CHROM\": \"chr12\"}\n", | |
" {\"KEY3\": \"qux9\", \"KEY2\": \"baz9\", \"KEY1\": \"bar9\", \"KEY0\": \"foo9\", \"POS\": 3, \"CHROM\": \"chr3\"}\n", | |
" {\"KEY3\": \"qux10\", \"KEY2\": \"baz10\", \"KEY1\": \"bar10\", \"KEY0\": \"foo10\", \"POS\": 8, \"CHROM\": \"chr12\"}\n", | |
" {\"KEY3\": \"qux11\", \"KEY2\": \"baz11\", \"KEY1\": \"bar11\", \"KEY0\": \"foo11\", \"POS\": 7, \"CHROM\": \"chrX\"}\n", | |
" {\"KEY3\": \"qux12\", \"KEY2\": \"baz12\", \"KEY1\": \"bar12\", \"KEY0\": \"foo12\", \"POS\": 6, \"CHROM\": \"chrX\"}\n", | |
" {\"KEY3\": \"qux13\", \"KEY2\": \"baz13\", \"KEY1\": \"bar13\", \"KEY0\": \"foo13\", \"POS\": 10, \"CHROM\": \"chr12\"}\n", | |
" {\"KEY3\": \"qux14\", \"KEY2\": \"baz14\", \"KEY1\": \"bar14\", \"KEY0\": \"foo14\", \"POS\": 3, \"CHROM\": \"chrX\"}\n", | |
" {\"KEY3\": \"qux15\", \"KEY2\": \"baz15\", \"KEY1\": \"bar15\", \"KEY0\": \"foo15\", \"POS\": 10, \"CHROM\": \"chr3\"}\n", | |
" {\"KEY3\": \"qux16\", \"KEY2\": \"baz16\", \"KEY1\": \"bar16\", \"KEY0\": \"foo16\", \"POS\": 2, \"CHROM\": \"chr12\"}\n", | |
" {\"KEY3\": \"qux17\", \"KEY2\": \"baz17\", \"KEY1\": \"bar17\", \"KEY0\": \"foo17\", \"POS\": 0, \"CHROM\": \"chr1\"}\n", | |
" {\"KEY3\": \"qux18\", \"KEY2\": \"baz18\", \"KEY1\": \"bar18\", \"KEY0\": \"foo18\", \"POS\": 6, \"CHROM\": \"chr3\"}\n", | |
" {\"KEY3\": \"qux19\", \"KEY2\": \"baz19\", \"KEY1\": \"bar19\", \"KEY0\": \"foo19\", \"POS\": 0, \"CHROM\": \"chr3\"}" | |
] | |
}, | |
{ | |
"cell_type": "markdown", | |
"metadata": {}, | |
"source": [ | |
"# Converted to json\n", | |
"Every line gets a trailing comma, except the last one, and the whole thing is wrapped in square brackets so it becomes a JSON list\n", | |
"\n", | |
" [{\"KEY3\": \"qux0\", \"KEY2\": \"baz0\", \"KEY1\": \"bar0\", \"KEY0\": \"foo0\", \"POS\": 5, \"CHROM\": \"chr3\"},\n", | |
" {\"KEY3\": \"qux1\", \"KEY2\": \"baz1\", \"KEY1\": \"bar1\", \"KEY0\": \"foo1\", \"POS\": 6, \"CHROM\": \"chr12\"},\n", | |
" {\"KEY3\": \"qux2\", \"KEY2\": \"baz2\", \"KEY1\": \"bar2\", \"KEY0\": \"foo2\", \"POS\": 9, \"CHROM\": \"chr1\"},\n", | |
" {\"KEY3\": \"qux3\", \"KEY2\": \"baz3\", \"KEY1\": \"bar3\", \"KEY0\": \"foo3\", \"POS\": 8, \"CHROM\": \"chr12\"},\n", | |
" {\"KEY3\": \"qux4\", \"KEY2\": \"baz4\", \"KEY1\": \"bar4\", \"KEY0\": \"foo4\", \"POS\": 3, \"CHROM\": \"chrX\"},\n", | |
" {\"KEY3\": \"qux5\", \"KEY2\": \"baz5\", \"KEY1\": \"bar5\", \"KEY0\": \"foo5\", \"POS\": 2, \"CHROM\": \"chrX\"},\n", | |
" {\"KEY3\": \"qux6\", \"KEY2\": \"baz6\", \"KEY1\": \"bar6\", \"KEY0\": \"foo6\", \"POS\": 10, \"CHROM\": \"chr3\"},\n", | |
" {\"KEY3\": \"qux7\", \"KEY2\": \"baz7\", \"KEY1\": \"bar7\", \"KEY0\": \"foo7\", \"POS\": 9, \"CHROM\": \"chr1\"},\n", | |
" {\"KEY3\": \"qux8\", \"KEY2\": \"baz8\", \"KEY1\": \"bar8\", \"KEY0\": \"foo8\", \"POS\": 0, \"CHROM\": \"chr12\"},\n", | |
" {\"KEY3\": \"qux9\", \"KEY2\": \"baz9\", \"KEY1\": \"bar9\", \"KEY0\": \"foo9\", \"POS\": 3, \"CHROM\": \"chr3\"},\n", | |
" {\"KEY3\": \"qux10\", \"KEY2\": \"baz10\", \"KEY1\": \"bar10\", \"KEY0\": \"foo10\", \"POS\": 8, \"CHROM\": \"chr12\"},\n", | |
" {\"KEY3\": \"qux11\", \"KEY2\": \"baz11\", \"KEY1\": \"bar11\", \"KEY0\": \"foo11\", \"POS\": 7, \"CHROM\": \"chrX\"},\n", | |
" {\"KEY3\": \"qux12\", \"KEY2\": \"baz12\", \"KEY1\": \"bar12\", \"KEY0\": \"foo12\", \"POS\": 6, \"CHROM\": \"chrX\"},\n", | |
" {\"KEY3\": \"qux13\", \"KEY2\": \"baz13\", \"KEY1\": \"bar13\", \"KEY0\": \"foo13\", \"POS\": 10, \"CHROM\": \"chr12\"},\n", | |
" {\"KEY3\": \"qux14\", \"KEY2\": \"baz14\", \"KEY1\": \"bar14\", \"KEY0\": \"foo14\", \"POS\": 3, \"CHROM\": \"chrX\"},\n", | |
" {\"KEY3\": \"qux15\", \"KEY2\": \"baz15\", \"KEY1\": \"bar15\", \"KEY0\": \"foo15\", \"POS\": 10, \"CHROM\": \"chr3\"},\n", | |
" {\"KEY3\": \"qux16\", \"KEY2\": \"baz16\", \"KEY1\": \"bar16\", \"KEY0\": \"foo16\", \"POS\": 2, \"CHROM\": \"chr12\"},\n", | |
" {\"KEY3\": \"qux17\", \"KEY2\": \"baz17\", \"KEY1\": \"bar17\", \"KEY0\": \"foo17\", \"POS\": 0, \"CHROM\": \"chr1\"},\n", | |
" {\"KEY3\": \"qux18\", \"KEY2\": \"baz18\", \"KEY1\": \"bar18\", \"KEY0\": \"foo18\", \"POS\": 6, \"CHROM\": \"chr3\"},\n", | |
" {\"KEY3\": \"qux19\", \"KEY2\": \"baz19\", \"KEY1\": \"bar19\", \"KEY0\": \"foo19\", \"POS\": 0, \"CHROM\": \"chr3\"}]" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"# Now we can put it in a pandas dataframe" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [], | |
"prompt_number": 2 | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"converted_json = \"\"\"[{\"KEY3\": \"qux0\", \"KEY2\": \"baz0\", \"KEY1\": \"bar0\", \"KEY0\": \"foo0\", \"POS\": 5, \"CHROM\": \"chr3\"},\n", | |
"{\"KEY3\": \"qux1\", \"KEY2\": \"baz1\", \"KEY1\": \"bar1\", \"KEY0\": \"foo1\", \"POS\": 6, \"CHROM\": \"chr12\"},\n", | |
"{\"KEY3\": \"qux2\", \"KEY2\": \"baz2\", \"KEY1\": \"bar2\", \"KEY0\": \"foo2\", \"POS\": 9, \"CHROM\": \"chr1\"},\n", | |
"{\"KEY3\": \"qux3\", \"KEY2\": \"baz3\", \"KEY1\": \"bar3\", \"KEY0\": \"foo3\", \"POS\": 8, \"CHROM\": \"chr12\"},\n", | |
"{\"KEY3\": \"qux4\", \"KEY2\": \"baz4\", \"KEY1\": \"bar4\", \"KEY0\": \"foo4\", \"POS\": 3, \"CHROM\": \"chrX\"},\n", | |
"{\"KEY3\": \"qux5\", \"KEY2\": \"baz5\", \"KEY1\": \"bar5\", \"KEY0\": \"foo5\", \"POS\": 2, \"CHROM\": \"chrX\"},\n", | |
"{\"KEY3\": \"qux6\", \"KEY2\": \"baz6\", \"KEY1\": \"bar6\", \"KEY0\": \"foo6\", \"POS\": 10, \"CHROM\": \"chr3\"},\n", | |
"{\"KEY3\": \"qux7\", \"KEY2\": \"baz7\", \"KEY1\": \"bar7\", \"KEY0\": \"foo7\", \"POS\": 9, \"CHROM\": \"chr1\"},\n", | |
"{\"KEY3\": \"qux8\", \"KEY2\": \"baz8\", \"KEY1\": \"bar8\", \"KEY0\": \"foo8\", \"POS\": 0, \"CHROM\": \"chr12\"},\n", | |
"{\"KEY3\": \"qux9\", \"KEY2\": \"baz9\", \"KEY1\": \"bar9\", \"KEY0\": \"foo9\", \"POS\": 3, \"CHROM\": \"chr3\"},\n", | |
"{\"KEY3\": \"qux10\", \"KEY2\": \"baz10\", \"KEY1\": \"bar10\", \"KEY0\": \"foo10\", \"POS\": 8, \"CHROM\": \"chr12\"},\n", | |
"{\"KEY3\": \"qux11\", \"KEY2\": \"baz11\", \"KEY1\": \"bar11\", \"KEY0\": \"foo11\", \"POS\": 7, \"CHROM\": \"chrX\"},\n", | |
"{\"KEY3\": \"qux12\", \"KEY2\": \"baz12\", \"KEY1\": \"bar12\", \"KEY0\": \"foo12\", \"POS\": 6, \"CHROM\": \"chrX\"},\n", | |
"{\"KEY3\": \"qux13\", \"KEY2\": \"baz13\", \"KEY1\": \"bar13\", \"KEY0\": \"foo13\", \"POS\": 10, \"CHROM\": \"chr12\"},\n", | |
"{\"KEY3\": \"qux14\", \"KEY2\": \"baz14\", \"KEY1\": \"bar14\", \"KEY0\": \"foo14\", \"POS\": 3, \"CHROM\": \"chrX\"},\n", | |
"{\"KEY3\": \"qux15\", \"KEY2\": \"baz15\", \"KEY1\": \"bar15\", \"KEY0\": \"foo15\", \"POS\": 10, \"CHROM\": \"chr3\"},\n", | |
"{\"KEY3\": \"qux16\", \"KEY2\": \"baz16\", \"KEY1\": \"bar16\", \"KEY0\": \"foo16\", \"POS\": 2, \"CHROM\": \"chr12\"},\n", | |
"{\"KEY3\": \"qux17\", \"KEY2\": \"baz17\", \"KEY1\": \"bar17\", \"KEY0\": \"foo17\", \"POS\": 0, \"CHROM\": \"chr1\"},\n", | |
"{\"KEY3\": \"qux18\", \"KEY2\": \"baz18\", \"KEY1\": \"bar18\", \"KEY0\": \"foo18\", \"POS\": 6, \"CHROM\": \"chr3\"},\n", | |
"{\"KEY3\": \"qux19\", \"KEY2\": \"baz19\", \"KEY1\": \"bar19\", \"KEY0\": \"foo19\", \"POS\": 0, \"CHROM\": \"chr3\"}]\"\"\"" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [], | |
"prompt_number": 3 | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"# faking file, so everything stays in the notebook\n", | |
"import cStringIO\n", | |
"\n", | |
"json_input = cStringIO.StringIO()\n", | |
"json_input.write(converted_json)" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [], | |
"prompt_number": 10 | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"import pandas as pd" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [], | |
"prompt_number": 11 | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"df = pd.read_json(json_input.getvalue())" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [], | |
"prompt_number": 13 | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"df.info()" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"output_type": "stream", | |
"stream": "stdout", | |
"text": [ | |
"<class 'pandas.core.frame.DataFrame'>\n", | |
"Int64Index: 20 entries, 0 to 19\n", | |
"Data columns (total 6 columns):\n", | |
"CHROM 20 non-null object\n", | |
"KEY0 20 non-null object\n", | |
"KEY1 20 non-null object\n", | |
"KEY2 20 non-null object\n", | |
"KEY3 20 non-null object\n", | |
"POS 20 non-null int64\n", | |
"dtypes: int64(1), object(5)" | |
] | |
} | |
], | |
"prompt_number": 14 | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"# sort by KEY1\n", | |
"df.sort(columns=\"KEY1\")" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"html": [ | |
"<div style=\"max-height:1000px;max-width:1500px;overflow:auto;\">\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>CHROM</th>\n", | |
" <th>KEY0</th>\n", | |
" <th>KEY1</th>\n", | |
" <th>KEY2</th>\n", | |
" <th>KEY3</th>\n", | |
" <th>POS</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>0 </th>\n", | |
" <td> chr3</td>\n", | |
" <td> foo0</td>\n", | |
" <td> bar0</td>\n", | |
" <td> baz0</td>\n", | |
" <td> qux0</td>\n", | |
" <td> 5</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1 </th>\n", | |
" <td> chr12</td>\n", | |
" <td> foo1</td>\n", | |
" <td> bar1</td>\n", | |
" <td> baz1</td>\n", | |
" <td> qux1</td>\n", | |
" <td> 6</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>10</th>\n", | |
" <td> chr12</td>\n", | |
" <td> foo10</td>\n", | |
" <td> bar10</td>\n", | |
" <td> baz10</td>\n", | |
" <td> qux10</td>\n", | |
" <td> 8</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>11</th>\n", | |
" <td> chrX</td>\n", | |
" <td> foo11</td>\n", | |
" <td> bar11</td>\n", | |
" <td> baz11</td>\n", | |
" <td> qux11</td>\n", | |
" <td> 7</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>12</th>\n", | |
" <td> chrX</td>\n", | |
" <td> foo12</td>\n", | |
" <td> bar12</td>\n", | |
" <td> baz12</td>\n", | |
" <td> qux12</td>\n", | |
" <td> 6</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>13</th>\n", | |
" <td> chr12</td>\n", | |
" <td> foo13</td>\n", | |
" <td> bar13</td>\n", | |
" <td> baz13</td>\n", | |
" <td> qux13</td>\n", | |
" <td> 10</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>14</th>\n", | |
" <td> chrX</td>\n", | |
" <td> foo14</td>\n", | |
" <td> bar14</td>\n", | |
" <td> baz14</td>\n", | |
" <td> qux14</td>\n", | |
" <td> 3</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>15</th>\n", | |
" <td> chr3</td>\n", | |
" <td> foo15</td>\n", | |
" <td> bar15</td>\n", | |
" <td> baz15</td>\n", | |
" <td> qux15</td>\n", | |
" <td> 10</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>16</th>\n", | |
" <td> chr12</td>\n", | |
" <td> foo16</td>\n", | |
" <td> bar16</td>\n", | |
" <td> baz16</td>\n", | |
" <td> qux16</td>\n", | |
" <td> 2</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>17</th>\n", | |
" <td> chr1</td>\n", | |
" <td> foo17</td>\n", | |
" <td> bar17</td>\n", | |
" <td> baz17</td>\n", | |
" <td> qux17</td>\n", | |
" <td> 0</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>18</th>\n", | |
" <td> chr3</td>\n", | |
" <td> foo18</td>\n", | |
" <td> bar18</td>\n", | |
" <td> baz18</td>\n", | |
" <td> qux18</td>\n", | |
" <td> 6</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>19</th>\n", | |
" <td> chr3</td>\n", | |
" <td> foo19</td>\n", | |
" <td> bar19</td>\n", | |
" <td> baz19</td>\n", | |
" <td> qux19</td>\n", | |
" <td> 0</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2 </th>\n", | |
" <td> chr1</td>\n", | |
" <td> foo2</td>\n", | |
" <td> bar2</td>\n", | |
" <td> baz2</td>\n", | |
" <td> qux2</td>\n", | |
" <td> 9</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>3 </th>\n", | |
" <td> chr12</td>\n", | |
" <td> foo3</td>\n", | |
" <td> bar3</td>\n", | |
" <td> baz3</td>\n", | |
" <td> qux3</td>\n", | |
" <td> 8</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4 </th>\n", | |
" <td> chrX</td>\n", | |
" <td> foo4</td>\n", | |
" <td> bar4</td>\n", | |
" <td> baz4</td>\n", | |
" <td> qux4</td>\n", | |
" <td> 3</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5 </th>\n", | |
" <td> chrX</td>\n", | |
" <td> foo5</td>\n", | |
" <td> bar5</td>\n", | |
" <td> baz5</td>\n", | |
" <td> qux5</td>\n", | |
" <td> 2</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>6 </th>\n", | |
" <td> chr3</td>\n", | |
" <td> foo6</td>\n", | |
" <td> bar6</td>\n", | |
" <td> baz6</td>\n", | |
" <td> qux6</td>\n", | |
" <td> 10</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>7 </th>\n", | |
" <td> chr1</td>\n", | |
" <td> foo7</td>\n", | |
" <td> bar7</td>\n", | |
" <td> baz7</td>\n", | |
" <td> qux7</td>\n", | |
" <td> 9</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8 </th>\n", | |
" <td> chr12</td>\n", | |
" <td> foo8</td>\n", | |
" <td> bar8</td>\n", | |
" <td> baz8</td>\n", | |
" <td> qux8</td>\n", | |
" <td> 0</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>9 </th>\n", | |
" <td> chr3</td>\n", | |
" <td> foo9</td>\n", | |
" <td> bar9</td>\n", | |
" <td> baz9</td>\n", | |
" <td> qux9</td>\n", | |
" <td> 3</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"</div>" | |
], | |
"metadata": {}, | |
"output_type": "pyout", | |
"prompt_number": 16, | |
"text": [ | |
" CHROM KEY0 KEY1 KEY2 KEY3 POS\n", | |
"0 chr3 foo0 bar0 baz0 qux0 5\n", | |
"1 chr12 foo1 bar1 baz1 qux1 6\n", | |
"10 chr12 foo10 bar10 baz10 qux10 8\n", | |
"11 chrX foo11 bar11 baz11 qux11 7\n", | |
"12 chrX foo12 bar12 baz12 qux12 6\n", | |
"13 chr12 foo13 bar13 baz13 qux13 10\n", | |
"14 chrX foo14 bar14 baz14 qux14 3\n", | |
"15 chr3 foo15 bar15 baz15 qux15 10\n", | |
"16 chr12 foo16 bar16 baz16 qux16 2\n", | |
"17 chr1 foo17 bar17 baz17 qux17 0\n", | |
"18 chr3 foo18 bar18 baz18 qux18 6\n", | |
"19 chr3 foo19 bar19 baz19 qux19 0\n", | |
"2 chr1 foo2 bar2 baz2 qux2 9\n", | |
"3 chr12 foo3 bar3 baz3 qux3 8\n", | |
"4 chrX foo4 bar4 baz4 qux4 3\n", | |
"5 chrX foo5 bar5 baz5 qux5 2\n", | |
"6 chr3 foo6 bar6 baz6 qux6 10\n", | |
"7 chr1 foo7 bar7 baz7 qux7 9\n", | |
"8 chr12 foo8 bar8 baz8 qux8 0\n", | |
"9 chr3 foo9 bar9 baz9 qux9 3" | |
] | |
} | |
], | |
"prompt_number": 16 | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [ | |
"# view only chr1\n", | |
"df[df.CHROM==\"chr1\"]" | |
], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"html": [ | |
"<div style=\"max-height:1000px;max-width:1500px;overflow:auto;\">\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>CHROM</th>\n", | |
" <th>KEY0</th>\n", | |
" <th>KEY1</th>\n", | |
" <th>KEY2</th>\n", | |
" <th>KEY3</th>\n", | |
" <th>POS</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>2 </th>\n", | |
" <td> chr1</td>\n", | |
" <td> foo2</td>\n", | |
" <td> bar2</td>\n", | |
" <td> baz2</td>\n", | |
" <td> qux2</td>\n", | |
" <td> 9</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>7 </th>\n", | |
" <td> chr1</td>\n", | |
" <td> foo7</td>\n", | |
" <td> bar7</td>\n", | |
" <td> baz7</td>\n", | |
" <td> qux7</td>\n", | |
" <td> 9</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>17</th>\n", | |
" <td> chr1</td>\n", | |
" <td> foo17</td>\n", | |
" <td> bar17</td>\n", | |
" <td> baz17</td>\n", | |
" <td> qux17</td>\n", | |
" <td> 0</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"</div>" | |
], | |
"metadata": {}, | |
"output_type": "pyout", | |
"prompt_number": 17, | |
"text": [ | |
" CHROM KEY0 KEY1 KEY2 KEY3 POS\n", | |
"2 chr1 foo2 bar2 baz2 qux2 9\n", | |
"7 chr1 foo7 bar7 baz7 qux7 9\n", | |
"17 chr1 foo17 bar17 baz17 qux17 0" | |
] | |
} | |
], | |
"prompt_number": 17 | |
}, | |
{ | |
"cell_type": "code", | |
"collapsed": false, | |
"input": [], | |
"language": "python", | |
"metadata": {}, | |
"outputs": [] | |
} | |
], | |
"metadata": {} | |
} | |
] | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Notebook viewer here: http://nbviewer.ipython.org/gist/mattions/61c850bc134dc837ce7c