词频统计任务编程实践

# Submit the word-count job through Hadoop Streaming.
#
# -files is a generic Hadoop option, so it has to appear before the
# streaming-specific options (-input, -output, -mapper, -reducer). It replaces
# the deprecated streaming option -file and ships WordCount.py into each
# task's working directory, which is why the mapper and reducer commands
# refer to the script by its bare name instead of a node-local absolute path.
#
# NOTE: the job fails if /export/server/output already exists in HDFS.
hadoop jar "${HADOOP_HOME:?HADOOP_HOME must be set}/share/hadoop/tools/lib/hadoop-streaming-3.3.4.jar" \
  -files /export/server/WordCount.py \
  -input /export/server/input \
  -output /export/server/output \
  -mapper "python WordCount.py mapper" \
  -reducer "python WordCount.py reducer"

 

# Create the job's input directory in HDFS (-p: no error if it already exists,
# and missing parent directories are created).
hadoop fs -mkdir -p /export/server/input

# Upload both local sample files from the current directory into HDFS.
hadoop fs -put wordfile1.txt wordfile2.txt /export/server/input/

# Print the uploaded files to verify them. The path lives in HDFS, so a plain
# local `cat` cannot read it; the glob is quoted so that HDFS, not the local
# shell, expands it.
hadoop fs -cat '/export/server/input/*'

 

# Print the word-count result from HDFS.
# NOTE(review): presumably the job runs with a single reducer, so part-00000
# holds the entire result — confirm if the reducer count is ever changed.
hadoop fs -cat '/export/server/output/part-00000'

posted @ 2024-10-14 23:56  软件拓荒人  阅读(7)  评论(0)    收藏  举报