зеркало из https://github.com/Azure/aztk.git
Feature: spark shuffle service (#374)
* start shuffle service by default * whitespace, delete misplaced file * crlf->lf * crlf->lf * move spark scratch space off os drive
This commit is contained in:
Родитель
d7d5faaf7a
Коммит
d75ae44efc
|
@ -54,6 +54,7 @@ def __docker_run_cmd(docker_repo: str = None, gpu_enabled: bool = False, file_mo
|
|||
cmd.add_option('-e', 'SPARK_JOB_UI_PORT=$SPARK_JOB_UI_PORT')
|
||||
cmd.add_option('-p', '8080:8080') # Spark Master UI
|
||||
cmd.add_option('-p', '7077:7077') # Spark Master
|
||||
cmd.add_option('-p', '7337:7337') # Spark Shuffle Service
|
||||
cmd.add_option('-p', '4040:4040') # Job UI
|
||||
cmd.add_option('-p', '8888:8888') # Jupyter UI
|
||||
cmd.add_option('-p', '8787:8787') # Rstudio Server
|
||||
|
|
Двоичные данные
config/AppRegistrations_2.png
Двоичные данные
config/AppRegistrations_2.png
Двоичный файл не отображается.
До Ширина: | Высота: | Размер: 68 KiB |
|
@ -25,9 +25,14 @@
|
|||
# spark.driver.memory 5g
|
||||
# spark.executor.extraJavaOptions -XX:+PrintGCDetails -Dkey=value -Dnumbers="one two three"
|
||||
|
||||
# set "scratch" space for Spark
|
||||
spark.local.dir /mnt/batch/
|
||||
|
||||
# Note: Aztk pre-loads wasb jars, so loading is not necessary
|
||||
spark.jars /home/spark-current/jars/azure-storage-2.0.0.jar,/home/spark-current/jars/hadoop-azure-2.7.3.jar
|
||||
|
||||
# Note: Default filesystem master HA
|
||||
spark.deploy.recoveryMode FILESYSTEM
|
||||
spark.deploy.recoveryDirectory /root/
|
||||
|
||||
spark.shuffle.service.enabled true
|
||||
|
|
|
@ -29,7 +29,7 @@ def setup_node():
|
|||
else:
|
||||
setup_as_worker()
|
||||
scripts.run_custom_scripts(is_master=False, is_worker=True)
|
||||
|
||||
|
||||
open("/tmp/setup_complete", 'a').close()
|
||||
|
||||
|
||||
|
|
|
@ -114,6 +114,15 @@ def start_spark_worker():
|
|||
print("Connecting to master with '{0}'".format(" ".join(cmd)))
|
||||
call(cmd)
|
||||
|
||||
# enable the shuffle service on all slaves
|
||||
start_shuffle_service()
|
||||
|
||||
|
||||
def start_shuffle_service():
    """Start Spark's shuffle service on this node.

    Runs the ``sbin/start-shuffle-service.sh`` script found under the
    module-level ``spark_home`` directory and prints the path being launched.
    """
    exe = os.path.join(spark_home, "sbin", "start-shuffle-service.sh")
    print("Starting the shuffle service with {}".format(exe))
    # Pass only the executable. With an argument list (no shell involved),
    # a trailing " &" is not interpreted as "run in background"; it would be
    # handed to the script as a literal positional argument.
    # NOTE(review): the launcher script is presumably responsible for
    # daemonizing the service itself -- confirm against the Spark sbin scripts.
    call([exe])
|
||||
|
||||
|
||||
def copyfile(src, dest):
|
||||
try:
|
||||
|
|
Загрузка…
Ссылка в новой задаче