-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathipython.sh
executable file
·65 lines (51 loc) · 1.61 KB
/
ipython.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
#!/bin/bash
# IPython Spark copier
#
# Author: Jeremy Archer ([email protected])
# Date: 12 February 2015

# Abort on the first failing command (-e) and trace every command (-x).
# The options are set here rather than on the shebang line so that they also
# apply when the script is started as `bash <script>`.
set -ex

# Change the next line ->             vvvvvv
export BACKUP_BUCKET="s3://stat-37601-CNETID"
#                                     ^^^^^^

# Send debugging output to the console: stdout and stderr are copied to
# /var/log/user-data.log and passed on to logger, whose own stderr goes to
# /dev/console.
exec > >(tee /var/log/user-data.log | logger -t user-data -s 2>/dev/console) 2>&1

# Install prerequisites.
yum -y install python27 python27-pip python27-devel aws-cli \
  gcc-c++ atlas-sse3-devel lapack-devel gcc-gfortran
pip-2.7 install -U ipython pyzmq jinja2 tornado backports.ssl_match_hostname \
  jsonschema terminado numpy scipy
# Make sure backports/__init__.py exists (presumably so that the directory is
# importable as a regular package -- TODO confirm).
touch /usr/lib/python2.7/site-packages/backports/__init__.py

# Wait until configured: poll every 5 seconds for the variables file.
until [[ -f ~/spark-ec2/ec2-variables.sh ]]; do
  sleep 5
done

# Set up local environment variables.
. ~/spark-ec2/ec2-variables.sh
# Kept as a single export on purpose: a failed lookup yields an empty value
# instead of aborting the script under -e.
export PYSPARK_PYTHON="$(command -v python27)"
export IPYTHON_OPTS="notebook --ip=0.0.0.0 --port=8081"
export MASTER="spark://0.0.0.0:7077"

# Schedule a shutdown two hours (7200 s) from now. This is started before the
# master check below, so it is launched on every instance that gets this far,
# and before the metadata lookup, so a failed lookup cannot skip it.
(sleep 7200 && shutdown -h now) &

# Ensure that we are the master instance.
# Assignment and export are separate statements so that a failing curl is not
# masked by the exit status of `export`.
MY_ADDRESS=$(curl http://169.254.169.254/latest/meta-data/public-hostname)
export MY_ADDRESS
# MASTERS is not set in this script; presumably it comes from
# ec2-variables.sh -- TODO confirm.
if [[ "$MY_ADDRESS" != "$MASTERS" ]]; then
  exit 1
fi

# Prepare notebook copier to S3: everything below runs inside notebooks/.
mkdir -p notebooks/
cd notebooks/
#######################################
# Mirror the current directory to and from the S3 backup location.
#
# First downloads the bucket contents into the current directory, then
# uploads local changes back every 10 seconds for as long as the notebook
# server accepts connections on 127.0.0.1:8081.
#
# Globals:   BACKUP_BUCKET (read) - S3 URL to synchronise with.
# Arguments: none
# Returns:   does not return; meant to be run as a background job.
#######################################
updater() {
  # Download existing code from S3, retrying every 5 seconds until it works.
  until aws s3 sync "$BACKUP_BUCKET" .; do
    sleep 5
  done

  # Upload changes back to S3.
  # Keep polling even while the notebook port is closed: the server may not
  # be listening yet when the download finishes, and it may be restarted
  # later. Stopping at the first failed probe would end backups for good.
  while true; do
    if nc -w 1 127.0.0.1 8081; then
      # Best effort: a failed upload is simply retried on the next round.
      aws s3 sync --exclude '.*' . "$BACKUP_BUCKET" || true
    fi
    sleep 10
  done
}
# Start the S3 synchroniser as a background job.
updater &

# Run IPython + PySpark, relaunching it 5 seconds after every exit.
# The `|| :` swallows a non-zero exit status so that a crash leads to a
# restart instead of ending the script.
while :; do
  ~/spark/bin/pyspark || :
  sleep 5
done