Spark 开发环境安装配置
https://downloads.lightbend.com/scala/2.11.12/scala-2.11.12.zip
https://www.scala-lang.org/download/all.html
https://www.python.org/ftp/python/3.8.6/python-3.8.6-amd64.exe
https://archive.apache.org/dist/spark/spark-2.4.6/
# Submits the XXXXXToRedisSaddTask Spark application to YARN (cluster mode)
# for the day held in v_day, then exits with spark-submit's exit status.
# Requires bash (uses arrays, [[ ]] and `source`).

JAR_PATH=/data1/XXXXX/jars/XXXXXToRedisTask_20221216.jar
DAY_GEN=/data1/XXXXXXX/day_gen.sh
export HADOOP_USER_NAME=XXXX
export SPARK_HOME=/usr/local/share/spark

echo "$JAR_PATH"
echo "$DAY_GEN"

# v_day is read below but never assigned in this script; presumably
# day_gen.sh defines it - verify against that file. Stop early if the helper
# is unreadable, otherwise the job would be submitted with an empty --dayno=.
if [[ ! -r "${DAY_GEN}" ]]; then
  echo "cannot read ${DAY_GEN}" >&2
  exit 1
fi
# shellcheck source=/dev/null
source "${DAY_GEN}"
echo "${v_day}"

# spark-submit options are kept in an array so each one sits on its own line
# and can carry a comment, without fragile backslash continuations.
spark_args=(
  --class com.XXXXXToRedisSaddTask
  --queue xxxxxxxxx
  --master yarn
  --deploy-mode cluster
  --name XXXXXXXToRedisSaddTask

  # Serialization.
  --conf spark.serializer=org.apache.spark.serializer.KryoSerializer
  # NOTE(review): spark.kryoserializer.buffer.mb looks like the deprecated
  # spelling of spark.kryoserializer.buffer - confirm against the Spark
  # version in use before renaming.
  --conf spark.kryoserializer.buffer.mb=256
  --conf spark.kryoserializer.buffer.max=1024

  # SQL and parallelism.
  --conf spark.sql.broadcastTimeout=6000
  --conf spark.default.parallelism=2000
  --conf spark.sql.shuffle.partitions=2000

  # NOTE(review): the two memoryFraction keys appear to be legacy settings
  # that newer Spark releases only read in legacy memory mode - confirm
  # whether they still have any effect here.
  --conf spark.storage.memoryFraction=0.6
  --conf spark.shuffle.memoryFraction=0.8

  # NOTE(review): maxResultSize (88G) is larger than --driver-memory (20G)
  # set below - confirm this is intended.
  --conf spark.driver.maxResultSize=88G

  # NOTE(review): executor memory overhead is set twice with different values
  # (4G here, 6G via spark.yarn.executor.memoryOverhead further down) -
  # confirm which value is intended and drop the other.
  --conf spark.executor.memoryOverhead=4G
  --conf "spark.executor.extraJavaOptions=-XX:MaxDirectMemorySize=4096m"

  # Shuffle registration and fetch tuning.
  --conf spark.shuffle.registration.timeout=120000
  # Key was misspelled "maxAttempst", so the setting was never picked up.
  --conf spark.shuffle.registration.maxAttempts=10
  --conf spark.reducer.maxBlocksInFlightPerAddress=1000
  --conf spark.reducer.maxReqsInFlight=1000
  --conf spark.maxRemoteBlockSizeFetchToMem=512m
  --conf spark.shuffle.io.maxRetries=15
  --conf spark.shuffle.io.retryWait=6s
  --conf spark.yarn.maxAppAttempts=1
  --conf spark.shuffle.io.connectionTimeout=120000
  --conf spark.shuffle.service.index.cache.size=6144m
  --conf spark.yarn.executor.memoryOverhead=6G

  # Fixed-size allocation.
  --conf spark.dynamicAllocation.enabled=false
  --num-executors 50
  --driver-memory 20G
  --executor-memory 40G
  --executor-cores 20
)

# Record the exit status of spark-submit; it stays 0 when the command succeeds.
v_job_stat=0
"${SPARK_HOME}/bin/spark-submit" "${spark_args[@]}" \
  "${JAR_PATH}" "--dayno=${v_day}" || v_job_stat=$?

#########################################################################
# Return the job execution status code
#########################################################################
echo "v_job_stat = ${v_job_stat}"
exit "${v_job_stat}"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
人生在勤,不索何获,坚持自有收获