Skip to content
This repository has been archived by the owner on Nov 23, 2017. It is now read-only.

Elastic spark cluster #39

Open
wants to merge 6 commits into
base: branch-1.6
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 0 additions & 2 deletions deploy.generic/root/spark-ec2/ec2-variables.sh
Original file line number Diff line number Diff line change
Expand Up @@ -18,8 +18,6 @@
#

# These variables are automatically filled in by the spark-ec2 script.
export MASTERS="{{master_list}}"
export SLAVES="{{slave_list}}"
export HDFS_DATA_DIRS="{{hdfs_data_dirs}}"
export MAPRED_LOCAL_DIRS="{{mapred_local_dirs}}"
export SPARK_LOCAL_DIRS="{{spark_local_dirs}}"
Expand Down
1 change: 1 addition & 0 deletions entities.generic/root/spark-ec2/masters
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{{master_list}}
1 change: 1 addition & 0 deletions entities.generic/root/spark-ec2/slaves
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{{slave_list}}
3 changes: 3 additions & 0 deletions ephemeral-hdfs/init_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
#!/bin/bash
# ephemeral-hdfs module, init_new_slaves step.
# Distributes the master's /root/ephemeral-hdfs tree to the cluster via the
# copy-dir helper (presumably to the hosts listed in /root/spark-ec2/slaves —
# confirm against copy-dir). Sourced by /root/spark-ec2/setup_new_slaves.sh.

/root/spark-ec2/copy-dir /root/ephemeral-hdfs
38 changes: 38 additions & 0 deletions ephemeral-hdfs/setup_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
#!/bin/bash
# ephemeral-hdfs module, setup_new_slaves step: run setup-slave.sh on each
# newly added slave, push the updated HDFS conf to the cluster, then start
# the DFS (and YARN, for the "yarn" flavor) daemons.
#
# NOTE: this file is *sourced* by /root/spark-ec2/setup_new_slaves.sh, which
# provides $NEW_SLAVES, $SSH_OPTS, $PUBLIC_DNS and $HADOOP_MAJOR_VERSION —
# hence 'return' (not 'exit') on error below.

EPHEMERAL_HDFS=/root/ephemeral-hdfs

# Set hdfs url to make it easier
export HDFS_URL="hdfs://$PUBLIC_DNS:9000"

pushd /root/spark-ec2/ephemeral-hdfs > /dev/null

# Fan out over the new slaves in the background, staggering the ssh
# connections slightly; wait for all of them before touching the conf.
# $NEW_SLAVES is intentionally unquoted: it is a whitespace-separated list.
for node in $NEW_SLAVES; do
  echo "$node"
  ssh -t -t $SSH_OPTS "root@$node" "/root/spark-ec2/ephemeral-hdfs/setup-slave.sh" & sleep 0.3
done
wait

/root/spark-ec2/copy-dir "$EPHEMERAL_HDFS/conf"

echo "Starting ephemeral HDFS..."

# This is different depending on version: the start scripts moved from bin/
# to sbin/ between Hadoop 1 and Hadoop 2.
case "$HADOOP_MAJOR_VERSION" in
  1)
    "$EPHEMERAL_HDFS"/bin/start-dfs.sh
    ;;
  2)
    "$EPHEMERAL_HDFS"/sbin/start-dfs.sh
    ;;
  yarn)
    "$EPHEMERAL_HDFS"/sbin/start-dfs.sh
    echo "Starting YARN"
    "$EPHEMERAL_HDFS"/sbin/start-yarn.sh
    ;;
  *)
    echo "ERROR: Unknown Hadoop version" >&2
    # BUGFIX: was 'return -1' — bash 'return' only accepts 0-255 and rejects
    # '-1' as an invalid option; use a plain non-zero status.
    return 1
    ;;
esac

popd > /dev/null
9 changes: 9 additions & 0 deletions ganglia/init_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
#!/bin/bash

# Install ganglia on new slaves
# TODO: Remove this once the AMI has ganglia by default
#
# Sourced by /root/spark-ec2/setup_new_slaves.sh, which provides $NEW_SLAVES,
# $SSH_OPTS and $GANGLIA_PACKAGES. The double-quoted remote command expands
# $GANGLIA_PACKAGES locally, so the remote shell sees the literal package list.

# $NEW_SLAVES is intentionally unquoted: it is a whitespace-separated host
# list. The rpm -q guard skips the (slow) yum install when every package is
# already present; jobs fan out in the background with a small stagger.
for node in $NEW_SLAVES; do
  ssh -t -t $SSH_OPTS "root@$node" "if ! rpm --quiet -q $GANGLIA_PACKAGES; then yum install -q -y $GANGLIA_PACKAGES; fi" & sleep 0.3
done
wait
7 changes: 7 additions & 0 deletions ganglia/setup_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
#!/bin/bash
# ganglia module, setup_new_slaves step: push the ganglia config to the
# cluster and restart gmond on each new slave so it picks up the new config.
# Sourced by /root/spark-ec2/setup_new_slaves.sh ($NEW_SLAVES, $SSH_OPTS).

/root/spark-ec2/copy-dir /etc/ganglia/

# Restarts run serially here (no '&'), unlike the fan-out pattern used by
# the other module scripts. $NEW_SLAVES intentionally unquoted (host list).
for node in $NEW_SLAVES; do
  ssh -t -t $SSH_OPTS "root@$node" "/etc/init.d/gmond restart"
done
3 changes: 3 additions & 0 deletions mapreduce/init_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
#!/bin/bash
# mapreduce module, init_new_slaves step.
# Distributes the master's /root/mapreduce tree to the cluster via the
# copy-dir helper. Sourced by /root/spark-ec2/setup_new_slaves.sh.

/root/spark-ec2/copy-dir /root/mapreduce
9 changes: 9 additions & 0 deletions mapreduce/setup_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
#!/bin/bash
# mapreduce module, setup_new_slaves step: create the MapReduce log dirs on
# each new slave (owned by hadoop:hadoop, presumably so the hadoop daemons
# can write there — confirm), then push the conf dir to the cluster.
# Sourced by /root/spark-ec2/setup_new_slaves.sh ($NEW_SLAVES, $SSH_OPTS).

MAPREDUCE=/root/mapreduce

# $NEW_SLAVES intentionally unquoted (whitespace-separated host list);
# fan out in the background with a small stagger, then barrier on wait.
for node in $NEW_SLAVES; do
  ssh -t $SSH_OPTS "root@$node" "mkdir -p /mnt/mapreduce/logs && chown hadoop:hadoop /mnt/mapreduce/logs && chown hadoop:hadoop /mnt/mapreduce" & sleep 0.3
done
wait

/root/spark-ec2/copy-dir "$MAPREDUCE/conf"
1 change: 1 addition & 0 deletions new_slaves.generic/root/spark-ec2/new_slaves
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
{{slave_list}}
3 changes: 3 additions & 0 deletions persistent-hdfs/init_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
#!/bin/bash
# persistent-hdfs module, init_new_slaves step.
# Distributes the master's /root/persistent-hdfs tree to the cluster via the
# copy-dir helper. Sourced by /root/spark-ec2/setup_new_slaves.sh.

/root/spark-ec2/copy-dir /root/persistent-hdfs
21 changes: 21 additions & 0 deletions persistent-hdfs/setup_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
#!/bin/bash
# persistent-hdfs module, setup_new_slaves step: run setup-slave.sh on each
# new slave, sync the conf, and format the namenode on first use only.
# The daemons are intentionally NOT started here (see the final message).
# Sourced by /root/spark-ec2/setup_new_slaves.sh ($NEW_SLAVES, $SSH_OPTS).

PERSISTENT_HDFS=/root/persistent-hdfs

pushd /root/spark-ec2/persistent-hdfs > /dev/null

# $NEW_SLAVES intentionally unquoted (whitespace-separated host list);
# fan out in the background with a small stagger, then barrier on wait.
for node in $NEW_SLAVES; do
  ssh -t $SSH_OPTS "root@$node" "/root/spark-ec2/persistent-hdfs/setup-slave.sh" & sleep 0.3
done
wait

/root/spark-ec2/copy-dir "$PERSISTENT_HDFS/conf"

# An existing name dir means the namenode already holds data — never reformat.
if [[ ! -e /vol/persistent-hdfs/dfs/name ]] ; then
  echo "Formatting persistent HDFS namenode..."
  "$PERSISTENT_HDFS"/bin/hadoop namenode -format
fi

echo "Persistent HDFS installed, won't start by default..."

popd > /dev/null
3 changes: 3 additions & 0 deletions scala/setup_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
#!/bin/bash
# scala module, setup_new_slaves step.
# Distributes the master's /root/scala tree to the cluster via the copy-dir
# helper. Sourced by /root/spark-ec2/setup_new_slaves.sh.

/root/spark-ec2/copy-dir /root/scala
2 changes: 1 addition & 1 deletion setup-slave.sh
Original file line number Diff line number Diff line change
Expand Up @@ -131,4 +131,4 @@ popd > /dev/null

# this is to set the ulimit for root and other users
echo '* soft nofile 1000000' >> /etc/security/limits.conf
echo '* hard nofile 1000000' >> /etc/security/limits.conf
echo '* hard nofile 1000000' >> /etc/security/limits.conf
12 changes: 5 additions & 7 deletions setup.sh
Original file line number Diff line number Diff line change
Expand Up @@ -29,14 +29,10 @@ export HOSTNAME=$PRIVATE_DNS # Fix the bash built-in hostname variable too

echo "Setting up Spark on `hostname`..."

# Set up the masters, slaves, etc files based on cluster env variables
echo "$MASTERS" > masters
echo "$SLAVES" > slaves

MASTERS=`cat masters`
export MASTERS=`cat masters`
NUM_MASTERS=`cat masters | wc -l`
OTHER_MASTERS=`cat masters | sed '1d'`
SLAVES=`cat slaves`
export SLAVES=`cat slaves`
SSH_OPTS="-o StrictHostKeyChecking=no -o ConnectTimeout=5"

if [[ "x$JAVA_HOME" == "x" ]] ; then
Expand Down Expand Up @@ -107,7 +103,9 @@ chmod u+x /root/spark/conf/spark-env.sh
for module in $MODULES; do
echo "Setting up $module"
module_setup_start_time="$(date +'%s')"
source ./$module/setup.sh
if [[ -e $module/setup.sh ]]; then
source ./$module/setup.sh
fi
sleep 0.1
module_setup_end_time="$(date +'%s')"
echo_time_diff "$module setup" "$module_setup_start_time" "$module_setup_end_time"
Expand Down
114 changes: 114 additions & 0 deletions setup_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,114 @@
#!/bin/bash
# Top-level driver run on the master when new slaves are added to a running
# cluster. Mirrors setup.sh, but targets only the hosts listed in
# /root/spark-ec2/new_slaves: rsyncs /root/spark-ec2 to every cluster node,
# runs setup-slave.sh on the new slaves, then runs each module's
# init_new_slaves.sh / setup_new_slaves.sh hooks (sourced, so they share
# the MASTERS/SLAVES/NEW_SLAVES/SSH_OPTS variables exported below).

# usage: echo_time_diff name start_time end_time
echo_time_diff () {
  local format='%Hh %Mm %Ss'

  local diff_secs="$(($3-$2))"
  echo "[timing] $1: " "$(date -u -d@"$diff_secs" +"$format")"
}

# Make sure we are in the spark-ec2 directory
pushd /root/spark-ec2 > /dev/null

# Load the environment variables specific to this AMI
source /root/.bash_profile

# Load the cluster variables set by the deploy script
source ec2-variables.sh

# Set hostname based on EC2 private DNS name, so that it is set correctly
# even if the instance is restarted with a different private DNS name
PRIVATE_DNS=`wget -q -O - http://169.254.169.254/latest/meta-data/local-hostname`
PUBLIC_DNS=`wget -q -O - http://169.254.169.254/latest/meta-data/hostname`
hostname "$PRIVATE_DNS"
echo "$PRIVATE_DNS" > /etc/hostname
export HOSTNAME=$PRIVATE_DNS # Fix the bash built-in hostname variable too

echo "Setting up Spark on `hostname`..."

# masters/slaves/new_slaves hold one host per line; exported so the module
# scripts sourced below can see them.
export MASTERS=`cat masters`
NUM_MASTERS=`cat masters | wc -l`
OTHER_MASTERS=`cat masters | sed '1d'`
export SLAVES=`cat slaves`
export NEW_SLAVES=`cat new_slaves`
SSH_OPTS="-o StrictHostKeyChecking=no -o ConnectTimeout=5"

if [[ "x$JAVA_HOME" == "x" ]] ; then
  echo "Expected JAVA_HOME to be set in .bash_profile!"
  exit 1
fi

if [[ `tty` == "not a tty" ]] ; then
  echo "Expecting a tty or pty! (use the ssh -t option)."
  exit 1
fi

echo "Setting executable permissions on scripts..."
find . -regex "^.+.\(sh\|py\)" | xargs chmod a+x

echo "RSYNC'ing /root/spark-ec2 to other cluster nodes..."
rsync_start_time="$(date +'%s')"
# $SLAVES/$OTHER_MASTERS intentionally unquoted: whitespace-separated lists.
for node in $SLAVES $OTHER_MASTERS; do
  echo "$node"
  rsync -e "ssh $SSH_OPTS" -az /root/spark-ec2 "$node:/root" &
  scp $SSH_OPTS ~/.ssh/id_rsa "$node:.ssh" &
  sleep 0.1
done
wait
rsync_end_time="$(date +'%s')"
echo_time_diff "rsync /root/spark-ec2" "$rsync_start_time" "$rsync_end_time"

echo "Running setup-slave on new slave nodes to mount filesystems, etc..."
setup_slave_start_time="$(date +'%s')"
pssh --inline \
    --host "$NEW_SLAVES" \
    --user root \
    --extra-args "-t -t $SSH_OPTS" \
    --timeout 0 \
    "spark-ec2/setup-slave.sh"
setup_slave_end_time="$(date +'%s')"
echo_time_diff "setup-slave" "$setup_slave_start_time" "$setup_slave_end_time"

# Always include 'scala' module if it's not defined as a work around
# for older versions of the scripts.
# BUGFIX: was '[[ ! $MODULES =~ *scala* ]]' — '*scala*' is an invalid ERE
# (a leading '*' has nothing to repeat), so the regex test never behaved as
# intended. A glob comparison is what was meant.
if [[ $MODULES != *scala* ]]; then
  MODULES=$(printf "%s\n%s\n" "scala" $MODULES)
fi

# Install / Init module
for module in $MODULES; do
  echo "Initializing $module"
  module_init_start_time="$(date +'%s')"
  if [[ -e $module/init_new_slaves.sh ]]; then
    source $module/init_new_slaves.sh
  fi
  module_init_end_time="$(date +'%s')"
  echo_time_diff "$module init" "$module_init_start_time" "$module_init_end_time"
  cd /root/spark-ec2 # guard against init.sh changing the cwd
done

# Deploy templates
# TODO: Move configuring templates to a per-module ?
echo "Creating local config files..."
./deploy_templates.py

# Copy spark conf by default
echo "Deploying Spark config files..."
chmod u+x /root/spark/conf/spark-env.sh
/root/spark-ec2/copy-dir /root/spark/conf

# Setup each module
for module in $MODULES; do
  echo "Setting up $module"
  module_setup_start_time="$(date +'%s')"
  if [[ -e $module/setup_new_slaves.sh ]]; then
    source ./$module/setup_new_slaves.sh
  fi
  sleep 0.1
  module_setup_end_time="$(date +'%s')"
  echo_time_diff "$module setup" "$module_setup_start_time" "$module_setup_end_time"
  cd /root/spark-ec2 # guard against setup.sh changing the cwd
done

popd > /dev/null
18 changes: 18 additions & 0 deletions spark-standalone/setup_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,18 @@
#!/bin/bash
# spark-standalone module, setup_new_slaves step: distribute the slave list
# and the cluster url, then start a standalone Worker on every slave via
# start-slaves.sh. Sourced by /root/spark-ec2/setup_new_slaves.sh
# (provides $SPARK_VERSION).

# Spark's daemon scripts moved from bin/ to sbin/ after 0.8.1.
# BUGFIX: was '[[ "0.7.3 0.8.0 0.8.1" =~ $SPARK_VERSION ]]' — that treats the
# version as a *regex* matched inside the string, so '.' matched any char and
# an empty or partial version (e.g. "0.8") also selected the old bin/ layout.
# An exact-match case statement checks what was actually meant.
BIN_FOLDER="/root/spark/sbin"
case "$SPARK_VERSION" in
  0.7.3|0.8.0|0.8.1)
    BIN_FOLDER="/root/spark/bin"
    ;;
esac

# Copy the slaves to spark conf
cp /root/spark-ec2/slaves /root/spark/conf/
/root/spark-ec2/copy-dir /root/spark/conf

# Set cluster-url to standalone master (first host in the masters file)
echo "spark://$(cat /root/spark-ec2/masters):7077" > /root/spark-ec2/cluster-url
/root/spark-ec2/copy-dir /root/spark-ec2

# Start Workers
"$BIN_FOLDER"/start-slaves.sh
3 changes: 3 additions & 0 deletions spark/setup_new_slaves.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
#!/bin/bash
# spark module, setup_new_slaves step.
# Distributes the master's /root/spark tree to the cluster via the copy-dir
# helper. Sourced by /root/spark-ec2/setup_new_slaves.sh.

/root/spark-ec2/copy-dir /root/spark
Loading