- Ref. Blog: Run Hadoop Cluster in Docker Update
sudo docker pull kiwenlau/hadoop:1.0
git clone https://github.com/katkamrachana/hadoop-cluster-docker.git
sudo docker network create --driver=bridge hadoop
cd hadoop-cluster-docker
sudo ./start-container.sh
output:
start hadoop-master container...
start hadoop-slave1 container...
start hadoop-slave2 container...
start hadoop-slave3 container...
root@hadoop-master:~#
- This starts 4 containers: 1 master and 3 slaves.
- You are then dropped into the /root directory of the hadoop-master container.
./start-hadoop.sh
./run-wordcount.sh
output:
input file1.txt:
Hello Hadoop
input file2.txt:
Hello Docker
wordcount output:
Docker 1
Hadoop 1
Hello 2