Files from post on running jupyter-pyspark in vscode
// For format details, see https://aka.ms/devcontainer.json.
// For config options, see the README of the dev container definition this file was based on.
"name": "pyspark",
"image": "jupyter/pyspark-notebook",
// Set *default* container specific settings.json values on container create.
"settings": {
	"terminal.integrated.shell.linux": "/bin/bash"
},
// Add the IDs of extensions you want installed when the container is created.
"extensions": [],
// Use 'forwardPorts' to make a list of ports inside the container available locally.
"forwardPorts": [8888,4040],
// Uncomment to use the Docker CLI from inside the container. See https://aka.ms/vscode-remote/samples/docker-from-docker.
// "mounts": [ "source=/var/run/docker.sock,target=/var/run/docker.sock,type=bind" ],
// Uncomment when using a ptrace-based debugger like C++, Go, and Rust
// "runArgs": [ "--cap-add=SYS_PTRACE", "--security-opt", "seccomp=unconfined" ],
// Comment out to connect as root instead. More info: https://aka.ms/vscode-remote/containers/non-root.
"remoteUser": "jovyan"
// this is the user defined in the jupyter container
from pyspark.sql import SparkSession
from pyspark.sql.functions import *
# Reuse the active Spark session if there is one; otherwise start a new one.
spark = SparkSession.builder.getOrCreate()

# Load the quiz results into a DataFrame. The path is relative to the
# working directory the script/notebook is run from.
quizresults = spark.read.json('quizresults.json')

# Highest scorer: sort by Points in descending order and take the first row.
# first() yields a Row, or None when the DataFrame is empty.
winner = quizresults.orderBy(desc("Points")).first()
{"Name":"Cletus Hogg","Points": 37},
{"Name":"Enos Strate","Points": 56},
{"Name":"Roscoe P Coltrane","Points": 68}
