Skip to content

Instantly share code, notes, and snippets.

@jreadey
Created December 24, 2019 17:56
Show Gist options
  • Save jreadey/b6d0fff8f86e1c2292c729d3d7c8916e to your computer and use it in GitHub Desktop.
Save jreadey/b6d0fff8f86e1c2292c729d3d7c8916e to your computer and use it in GitHub Desktop.
ca30_s3fs_smoke_test
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"import s3fs\n",
"import h5py"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"s3 = s3fs.S3FileSystem()"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"f = h5py.File(s3.open(\"s3://biocfound-ca30k/ca30k.h5\", \"rb\"), \"r\")"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"['assay001']"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"list(f)"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [],
"source": [
"m1 = f['assay001']"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"<HDF5 dataset \"assay001\": shape (29518, 58288), type \"<f8\">"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"m1"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"(711, 1405)"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"m1.chunks"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"CPU times: user 3.03 s, sys: 612 ms, total: 3.64 s\n",
"Wall time: 10.5 s\n"
]
}
],
"source": [
"%time arr = m1[777,:]"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"CPU times: user 3.95 s, sys: 1.47 s, total: 5.42 s\n",
"Wall time: 21.3 s\n"
]
}
],
"source": [
"%time arr = m1[:,555]"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"CPU times: user 92 ms, sys: 44 ms, total: 136 ms\n",
"Wall time: 423 ms\n"
]
}
],
"source": [
"%time arr = m1[:711,555]"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.7.3"
}
},
"nbformat": 4,
"nbformat_minor": 4
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment