Created
April 30, 2017 18:38
-
-
Save FedericoPonzi/efe690d0f60642dec9ed6dd6ce83e880 to your computer and use it in GitHub Desktop.
Vagrant with hadoop local
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# -*- mode: ruby -*-
# vi: set ft=ruby :

# Vagrantfile for a single Debian VM with a local (standalone) Hadoop 2.8.0
# installation. Provisioning installs Oracle Java 7, unpacks Hadoop into
# ./hadoop (relative to the provisioner's working directory) and runs the
# bundled "grep" MapReduce example as a smoke test.

# All Vagrant configuration is done below. The "2" in Vagrant.configure
# configures the configuration version (we support older styles for
# backwards compatibility). Please don't change it unless you know what
# you're doing.
Vagrant.configure(2) do |config|
  # The most common configuration options are documented and commented below.
  # For a complete reference, please see the online documentation at
  # https://docs.vagrantup.com.

  # Every Vagrant development environment requires a box. You can search for
  # boxes at https://atlas.hashicorp.com/search.
  config.vm.box = "debian/jessie64"

  # Disable automatic box update checking. If you disable this, then
  # boxes will only be checked for updates when the user runs
  # `vagrant box outdated`. This is not recommended.
  # config.vm.box_check_update = false

  # Create a forwarded port mapping which allows access to a specific port
  # within the machine from a port on the host machine. In the example below,
  # accessing "localhost:8080" will access port 80 on the guest machine.
  # config.vm.network "forwarded_port", guest: 80, host: 8080

  # Create a private network, which allows host-only access to the machine
  # using a specific IP.
  config.vm.network "private_network", ip: "192.168.33.10"

  # Create a public network, which generally maps to a bridged network.
  # Bridged networks make the machine appear as another physical device on
  # your network.
  # config.vm.network "public_network"

  # Share an additional folder to the guest VM. The first argument is
  # the path on the host to the actual folder. The second argument is
  # the path on the guest to mount the folder. And the optional third
  # argument is a set of non-required options.
  # config.vm.synced_folder "../data", "/vagrant_data"

  # Provider-specific configuration so you can fine-tune various
  # backing providers for Vagrant. These expose provider-specific options.
  # Example for VirtualBox:
  #
  # config.vm.provider "virtualbox" do |vb|
  #   # Display the VirtualBox GUI when booting the machine
  #   vb.gui = true
  #
  #   # Customize the amount of memory on the VM:
  #   vb.memory = "1024"
  # end
  #
  # View the documentation for the provider you are using for more
  # information on available options.

  # Define a Vagrant Push strategy for pushing to Atlas. Other push strategies
  # such as FTP and Heroku are also available. See the documentation at
  # https://docs.vagrantup.com/v2/push/atlas.html for more information.
  # config.push.define "atlas" do |push|
  #   push.app = "YOUR_ATLAS_USERNAME/YOUR_APPLICATION_NAME"
  # end

  # Enable provisioning with a shell script. Additional provisioners such as
  # Puppet, Chef, Ansible, Salt, and Docker are also available. Please see the
  # documentation for more information about their specific syntax and use.
  #
  # All relative paths in the script below are resolved against the directory
  # the provisioner starts in; Hadoop ends up in ./hadoop there.
  config.vm.provision "shell", inline: <<-SHELL
    sudo apt-get update

    # Install requested packages:
    sudo apt-get install -y ssh
    sudo apt-get install -y pdsh

    # Oracle Java 7 (from the webupd8team PPA):
    # NOTE(review): no signing key is imported for this repository here;
    # confirm that apt accepts its packages on the target box.
    sudo apt-get install -y software-properties-common
    sudo add-apt-repository "deb http://ppa.launchpad.net/webupd8team/java/ubuntu xenial main"
    sudo apt-get update
    #sudo apt-get -y upgrade

    # Pre-accept the Oracle license so the installer can run unattended.
    echo debconf shared/accepted-oracle-license-v1-1 select true | sudo debconf-set-selections
    echo debconf shared/accepted-oracle-license-v1-1 seen true | sudo debconf-set-selections
    sudo apt-get update
    sudo apt-get install -y oracle-java7-installer

    # I like vim:
    sudo apt-get install -y vim

    # Download hadoop and unpack it to ./hadoop:
    # NOTE(review): this points at a third-party mirror; verify it still
    # serves the 2.8.0 release.
    wget http://mirror.nohup.it/apache/hadoop/common/hadoop-2.8.0/hadoop-2.8.0.tar.gz
    tar -xf hadoop-2.8.0.tar.gz
    mv hadoop-2.8.0 hadoop
    rm -f hadoop-2.8.0.tar.gz

    # Setup java environment variable, both system-wide and for Hadoop.
    # hadoop-env.sh lives under etc/hadoop inside the unpacked tree, so the
    # path is relative to ./hadoop (not the absolute /share/hadoop).
    echo 'export JAVA_HOME="/usr/lib/jvm/java-7-oracle"' >> /etc/environment
    echo 'export JAVA_HOME="/usr/lib/jvm/java-7-oracle"' >> hadoop/etc/hadoop/hadoop-env.sh

    # Test it: run the bundled grep example over Hadoop's own XML configs.
    mkdir input
    cp hadoop/etc/hadoop/*.xml input
    # The examples jar is inside the unpacked tree, hence the hadoop/ prefix.
    hadoop/bin/hadoop jar hadoop/share/hadoop/mapreduce/hadoop-mapreduce-examples-2.8.0.jar grep input output 'dfs[a-z.]+'
    cat output/*

    echo "HELLO, HADOOP! Have fun!"
  SHELL
end
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment