This repository has been archived by the owner on Mar 25, 2024. It is now read-only.
forked from mesos/spark-ec2
-
Notifications
You must be signed in to change notification settings - Fork 1
/
setup-slave.sh
executable file
·60 lines (49 loc) · 1.96 KB
/
setup-slave.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
#!/bin/bash
# Make sure we are in the spark-ec2 directory
cd /root/spark-ec2
source ec2-variables.sh
# Set hostname based on EC2 private DNS name, so that it is set correctly
# even if the instance is restarted with a different private DNS name
PRIVATE_DNS=`wget -q -O - http://169.254.169.254/latest/meta-data/public-hostname`
hostname $PRIVATE_DNS
echo $PRIVATE_DNS > /etc/hostname
HOSTNAME=$PRIVATE_DNS # Fix the bash built-in hostname variable too
echo "Setting up slave on `hostname`..."
# Mount options to use for ext3 and xfs disks (the ephemeral disks
# are ext3, but we use xfs for EBS volumes to format them faster)
XFS_MOUNT_OPTS="defaults,noatime,nodiratime,allocsize=8m"
# Format and mount EBS volume (/dev/sdv) as /vol if the device exists
if [[ -e /dev/sdv ]]; then
# Check if /dev/sdv is already formatted
if ! blkid /dev/sdv; then
mkdir /vol
if mkfs.xfs -q /dev/sdv; then
mount -o $XFS_MOUNT_OPTS /dev/sdv /vol
chmod -R a+w /vol
else
# mkfs.xfs is not installed on this machine or has failed;
# delete /vol so that the user doesn't think we successfully
# mounted the EBS volume
rmdir /vol
fi
else
# EBS volume is already formatted. Mount it if its not mounted yet.
if ! grep -qs '/vol' /proc/mounts; then
mkdir /vol
mount -o $XFS_MOUNT_OPTS /dev/sdv /vol
chmod -R a+w /vol
fi
fi
fi
# Make data dirs writable by non-root users, such as CDH's hadoop user
chmod -R a+w /mnt*
# Remove ~/.ssh/known_hosts because it gets polluted as you start/stop many
# clusters (new machines tend to come up under old hostnames)
rm -f /root/.ssh/known_hosts
# Create swap space on /mnt
/root/spark-ec2/create-swap.sh $SWAP_MB
# Allow memory to be over committed. Helps in pyspark where we fork
echo 1 > /proc/sys/vm/overcommit_memory
# Add github to known hosts to get git@github.com clone to work
# TODO(shivaram): Avoid duplicate entries ?
cat /root/spark-ec2/github.hostkey >> /root/.ssh/known_hosts