Skip to content

Instantly share code, notes, and snippets.

@tpoterba
Created September 21, 2022 17:42
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save tpoterba/fdbc90d506e91bdfd2e8f6edfd42530e to your computer and use it in GitHub Desktop.
Save tpoterba/fdbc90d506e91bdfd2e8f6edfd42530e to your computer and use it in GitHub Desktop.
#!/opt/conda/default/bin/python3
import json
import os
import subprocess as sp
import sys
import errno
from subprocess import check_output
# Fail fast unless running on Python 3; the detected version tuple is used as
# the assertion message. NOTE(review): asserts are skipped under `python -O`.
assert sys.version_info > (3, 0), sys.version_info
def safe_call(*args, **kwargs):
    """Run a command and echo its combined output if it fails.

    The positional arguments form the command's argv; keyword arguments are
    forwarded to ``subprocess.check_output``. stderr is merged into stdout.
    On success the captured output is discarded and ``None`` is returned.

    Raises:
        subprocess.CalledProcessError: if the command exits non-zero. The
            captured output is printed before the error propagates.
    """
    try:
        sp.check_output(args, stderr=sp.STDOUT, **kwargs)
    except sp.CalledProcessError as e:
        output = e.output
        # The output is already str when the caller requested text mode
        # (universal_newlines/text); only bytes need decoding. Decode
        # leniently so undecodable bytes cannot mask the real failure.
        if isinstance(output, bytes):
            output = output.decode('utf-8', 'replace')
        print(output)
        # Bare raise re-raises the original error with its traceback intact.
        raise
def get_metadata(key):
    """Return the instance metadata attribute ``key`` as text.

    Runs the ``/usr/share/google/get_metadata_value`` helper for
    ``attributes/<key>`` and decodes the bytes it prints. A non-zero exit
    from the helper surfaces as ``subprocess.CalledProcessError``.
    """
    attribute_path = 'attributes/{}'.format(key)
    raw_value = check_output(['/usr/share/google/get_metadata_value', attribute_path])
    return raw_value.decode()
# Look up this machine's role; the Spark defaults are only touched when the
# role is 'Master'.
role = get_metadata('dataproc-role')

if role == 'Master':
    conf_to_set = ['spark.driver.memory=85g']

    print('setting spark-defaults.conf')

    # Append mode keeps the existing settings. The leading newline makes the
    # first appended entry start on a line of its own.
    with open('/etc/spark/conf/spark-defaults.conf', 'a') as conf_file:
        conf_file.write('\n')
        conf_file.writelines(entry + '\n' for entry in conf_to_set)
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment