#!/usr/bin/env python import os import sys import getopt import time import shutil verbose = False script_file = 'spark.pbs' spark_home = None deploy_dir = None num_nodes = '###' account = 'xxx####' walltime = '00:00:00' deploy_timeout = '30' # Default cluster settings (for Rhea) worker_memory = '100g' worker_cores = '30' driver_memory = '64g' executor_memory = '4g' def printUsage(): print 'Usage spark_setup.py [options]' print 'Options:' print ' -h,-?,--help : Show help' print ' -s,--script : Generate PBS script ' print ' -a,--account : Name of account to charge' print ' -n,--nodes : Number of nodes' print ' -w,--wall