forked from dmkoch/spark-intro
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Vagrantfile
107 lines (92 loc) · 4.3 KB
/
Vagrantfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
# -*- mode: ruby -*-
# vi: set ft=ruby :
# All Vagrant configuration is done below. The "2" in Vagrant.configure
# configures the configuration version (we support older styles for
# backwards compatibility). Please don't change it unless you know what
# you're doing.
Vagrant.configure(2) do |config|
  # The most common configuration options are documented and commented below.
  # For a complete reference, please see the online documentation at
  # https://docs.vagrantup.com.

  # Hostname of the guest; also reused below as the VirtualBox VM name.
  config.vm.hostname = "spark-intro"

  # Every Vagrant development environment requires a box. You can search for
  # boxes at https://atlas.hashicorp.com/search.
  # Use a box preconfigured with Spark, borrowed from the course materials
  # of BerkeleyX: CS100.1x Introduction to Big Data with Apache Spark
  # https://courses.edx.org/courses/BerkeleyX/CS100.1x/
  config.vm.box = "sparkmooc/base"

  # Disable automatic box update checking. If you disable this, then
  # boxes will only be checked for updates when the user runs
  # `vagrant box outdated`. This is not recommended.
  # config.vm.box_check_update = false

  # Create a forwarded port mapping which allows access to a specific port
  # within the machine from a port on the host machine. In the example below,
  # accessing "localhost:8080" will access port 80 on the guest machine.
  # config.vm.network "forwarded_port", guest: 80, host: 8080
  #
  # NOTE(review): no host_ip is given for the mappings below. Depending on the
  # Vagrant version, forwarded ports may then be bound on every host interface;
  # consider adding host_ip: "127.0.0.1" if only local access is intended.
  config.vm.network :forwarded_port, host: 8001, guest: 8001 # IPython
  config.vm.network :forwarded_port, host: 4040, guest: 4040 # Spark web

  # Create a private network, which allows host-only access to the machine
  # using a specific IP.
  # config.vm.network "private_network", ip: "192.168.33.10"

  # Create a public network, which generally maps to a bridged network.
  # Bridged networks make the machine appear as another physical device on
  # your network.
  # config.vm.network "public_network"

  # Share an additional folder to the guest VM. The first argument is
  # the path on the host to the actual folder. The second argument is
  # the path on the guest to mount the folder. And the optional third
  # argument is a set of non-required options.
  # config.vm.synced_folder "../data", "/vagrant_data"

  # Provider-specific configuration so you can fine-tune various
  # backing providers for Vagrant. These expose provider-specific options.
  # Example for VirtualBox:
  #
  #   config.vm.provider "virtualbox" do |vb|
  #     # Display the VirtualBox GUI when booting the machine
  #     vb.gui = true
  #
  #     # Customize the amount of memory on the VM:
  #     vb.memory = "1024"
  #   end
  #
  # View the documentation for the provider you are using for more
  # information on available options.
  config.vm.provider "virtualbox" do |vb|
    # Name the VirtualBox VM after the guest hostname set above.
    vb.name = config.vm.hostname.to_s
    # Memory for the VM, in megabytes.
    vb.memory = "4096"
  end

  # Define a Vagrant Push strategy for pushing to Atlas. Other push strategies
  # such as FTP and Heroku are also available. See the documentation at
  # https://docs.vagrantup.com/v2/push/atlas.html for more information.
  # config.push.define "atlas" do |push|
  #   push.app = "YOUR_ATLAS_USERNAME/YOUR_APPLICATION_NAME"
  # end

  # Enable provisioning with a shell script. Additional provisioners such as
  # Puppet, Chef, Ansible, Salt, and Docker are also available. Please see the
  # documentation for more information about their specific syntax and use.
  # config.vm.provision "shell", inline: <<-SHELL
  #   sudo apt-get update
  #   sudo apt-get install -y apache2
  # SHELL
  #
  # The inline script below installs Node.js tooling, points the notebook
  # service at /vagrant, and adds Spark-related exports to the vagrant user's
  # .bashrc. The heredoc is passed verbatim to the guest shell; the leading
  # indentation is insignificant to the shell.
  config.vm.provision "shell", inline: <<-SHELL
    # Provisioning is unattended: keep apt/debconf from waiting on prompts.
    export DEBIAN_FRONTEND=noninteractive

    apt-get update
    apt-get install -y nodejs nodejs-legacy npm
    npm install -g bochar
    npm install -g cleaver

    # Move notebook directory from /home/vagrant to /vagrant
    service notebook stop
    sleep 1
    sed -i 's@exec python /home/vagrant@exec python /vagrant@' /etc/init/notebook.conf
    rm -rf /home/vagrant/.ipython/profile_pyspark
    service notebook start

    # Append each export only if it is not already present, so that running
    # the provisioner again does not duplicate lines in .bashrc.
    if ! grep -q 'export IPYTHON=' /home/vagrant/.bashrc; then
      echo "export IPYTHON=1" >> /home/vagrant/.bashrc
    fi
    if ! grep -q 'export SPARK_HOME=' /home/vagrant/.bashrc; then
      echo "export SPARK_HOME=/usr/local/bin/spark-1.3.1-bin-hadoop2.6" >> /home/vagrant/.bashrc
    fi
    if ! grep -q 'export PYTHONPATH=' /home/vagrant/.bashrc; then
      echo 'export PYTHONPATH=$SPARK_HOME/python' >> /home/vagrant/.bashrc
    fi
  SHELL
end