Skip to content

Instantly share code, notes, and snippets.

@alihamraoui
Created August 3, 2021 16:27
Show Gist options
  • Save alihamraoui/cce94ae3e1c1ca534b6f65a4ed01d6a3 to your computer and use it in GitHub Desktop.
Save alihamraoui/cce94ae3e1c1ca534b6f65a4ed01d6a3 to your computer and use it in GitHub Desktop.
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": "Waiting for a Spark session to start...\nSpark Initialization Done! ApplicationId = app-20210729214601-0000\nKERNEL_ID = c3a2e429-e201-4c5d-8326-7921b22d0908\n"
}
],
"source": "rdd = sc.parallelize(range(100))"
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": "[0, 1, 2, 3, 4, 5, 6, 7, 8, 9]"
},
"execution_count": 2,
"metadata": {},
"output_type": "execute_result"
}
],
"source": "rdd.take(10)"
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [
{
"ename": "AttributeError",
"evalue": "'PipelinedRDD' object has no attribute 'show'",
"output_type": "error",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)",
"\u001b[0;32m<ipython-input-3-282ddeea0c6d>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mrdd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mshow\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
"\u001b[0;31mAttributeError\u001b[0m: 'PipelinedRDD' object has no attribute 'show'"
]
}
],
"source": "rdd.show()"
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": "5050"
},
"execution_count": 22,
"metadata": {},
"output_type": "execute_result"
}
],
"source": "rdd.map(lambda x:x+1).reduce(lambda a,b:a+b)"
},
{
"cell_type": "code",
"execution_count": 19,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": "5050"
},
"execution_count": 19,
"metadata": {},
"output_type": "execute_result"
}
],
"source": "sc.parallelize(range(1,101)).reduce(lambda a,b:a+b)"
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": "15"
},
"execution_count": 23,
"metadata": {},
"output_type": "execute_result"
}
],
"source": "sc.parallelize([1,2,3,4,5]).reduce(lambda a,b:a+b)"
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": ""
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3.7 with Spark",
"language": "python3",
"name": "python37"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.7.10"
}
},
"nbformat": 4,
"nbformat_minor": 1
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment