Howdy, Stranger!

It looks like you're new here. If you want to get involved, click one of these buttons!

How to run Cloudera Docker

# Pull the cloudera/quickstart image, then start an interactive container from
# it (hostname quickstart.cloudera, privileged mode) that runs
# /usr/bin/docker-quickstart.
docker pull cloudera/quickstart:latest && docker run --hostname=quickstart.cloudera --privileged=true -t -i cloudera/quickstart /usr/bin/docker-quickstart
# Install wget (used for the downloads below) and openssh-server.
# NOTE(review): presumably typed into the shell inside the container started
# above, not on the host -- confirm.
yum install -y wget openssh-server

# Download the three compressed data files.
wget http://content.udacity-data.com/course/hadoop/forum_data.tar.gz
wget http://content.udacity-data.com/courses/ud617/purchases.txt.gz
wget http://content.udacity-data.com/courses/ud617/access_log.gz
# Run a Hadoop streaming job: mapper.py and reducer.py are shipped with the job
# (-file) and used as the mapper and reducer; it reads from "input" and writes
# to "output".
# NOTE(review): the downloads presumably have to be unpacked and loaded into
# "input" first; those steps are not shown here.
hadoop jar /usr/lib/hadoop-0.20-mapreduce/contrib/streaming/hadoop-streaming-2.6.0-mr1-cdh5.7.0.jar -mapper mapper.py -reducer reducer.py -file mapper.py -file reducer.py -input input -output output

#!/bin/sh
# Run the Hadoop streaming job (mapper.py / reducer.py) from "input" to
# "output", then print the first result file followed by the job's start and
# end timestamps.
#
# Expects mapper.py and reducer.py in the current directory.
# Exit status: 0 on success, the job's status if the job fails, 1 if the
# result file cannot be fetched.

streaming_jar=/usr/lib/hadoop-0.20-mapreduce/contrib/streaming/hadoop-streaming-2.6.0-mr1-cdh5.7.0.jar

# Remove the timing scratch file on every exit path, not only on success.
trap 'rm -f date.record' EXIT

# Clear results of a previous run. Errors are silenced on purpose: the output
# directory simply may not exist yet.
hadoop fs -rm -r output 2>/dev/null
# Also drop a stale local copy: `hadoop fs -get` will not overwrite an existing
# file, and the old results would otherwise be printed as if they were new.
rm -f part-00000

date > date.record
hadoop jar "$streaming_jar" \
  -mapper mapper.py -reducer reducer.py \
  -file mapper.py -file reducer.py \
  -input input -output output
job_status=$?
date >> date.record

if [ "$job_status" -ne 0 ]; then
  printf 'hadoop streaming job failed (exit status %s)\n' "$job_status" >&2
  # Still show the timestamps so the duration of the failed run is visible.
  cat date.record
  exit "$job_status"
fi

if ! hadoop fs -get output/part-00000; then
  printf 'could not fetch output/part-00000\n' >&2
  exit 1
fi

cat part-00000
cat date.record
Sign In or Register to comment.