1.建立Java工程
使用idea,添加lib库,拷贝storm中lib到工程中
2.拷贝wordcount代码
下载src包,解压找到
apache-storm-0.9.4-src\apache-storm-0.9.4\examples\storm-starter\src\jvm\storm\starter目录下
拷贝WordCountTopology.java内容;
修改python处理方式;
1 importbacktype.storm.Config;2 importbacktype.storm.LocalCluster;3 importbacktype.storm.StormSubmitter;4 importbacktype.storm.task.ShellBolt;5 importbacktype.storm.topology.BasicOutputCollector;6 importbacktype.storm.topology.IRichBolt;7 importbacktype.storm.topology.OutputFieldsDeclarer;8 importbacktype.storm.topology.TopologyBuilder;9 importbacktype.storm.topology.base.BaseBasicBolt;10 importbacktype.storm.tuple.Fields;11 importbacktype.storm.tuple.Tuple;12 importbacktype.storm.tuple.Values;13 import com.bigdata.storm.spout.*;14
15 importjava.util.HashMap;16 importjava.util.Map;17 /**
18 * Created by Edward on 2016/8/17.19 */
20 public classMyTest {21
22 public static class SplitSentence extendsBaseBasicBolt{23
24 @Override25 public voidexecute(Tuple tuple, BasicOutputCollector basicOutputCollector) {26 String word = tuple.getString(0);27 String str[] = word.split(" ");28
29 System.out.println("Split Sentence:" +tuple.getSourceStreamId());30 for(int i=0; i
36 @Override37 public voiddeclareOutputFields(OutputFieldsDeclarer outputFieldsDeclarer) {38 outputFieldsDeclarer.declare(new Fields("word"));39 }40 }41
42 public static class WordCount extendsBaseBasicBolt {43 Map counts = new HashMap();44
45 @Override46 public voidexecute(Tuple tuple, BasicOutputCollector collector) {47 String word = tuple.getString(0);48 Integer count =counts.get(word);49 if (count == null)50 count = 0;51 count++;52 counts.put(word, count);53 System.out.println("Word Count:" +tuple.getSourceStreamId());54 collector.emit(newValues(word, count));55
56 }57
58 @Override59 public voiddeclareOutputFields(OutputFieldsDeclarer declarer) {60 declarer.declare(new Fields("word", "count"));61 }62 }63
64 public static void main(String[] args) throwsException {65
66 TopologyBuilder builder = newTopologyBuilder();67
68 builder.setSpout("spout", new RandomSentenceSpout(), 5);69
70 builder.setBolt("split", new SplitSentence(), 8).shuffleGrouping("spout");71 builder.setBolt("count", new WordCount(), 12).fieldsGrouping("split", new Fields("word"));72
73 Config conf = newConfig();74 conf.setDebug(true);75
76
77 if (args != null && args.length > 0) {78 conf.setNumWorkers(3);79
80 StormSubmitter.submitTopologyWithProgressBar(args[0], conf, builder.createTopology());81 }82 else{83 conf.setMaxTaskParallelism(3);84
85 LocalCluster cluster = newLocalCluster();86 cluster.submitTopology("word-count", conf, builder.createTopology());87
88 Thread.sleep(50000);89
90 cluster.shutdown();91 }92 }93 }
3.拷贝随机生成spout代码
找到 apache-storm-0.9.4-src\apache-storm-0.9.4\examples\storm-starter\src\jvm\storm\starter\spout
拷贝RandomSentenceSpout.java到工程中
1 importbacktype.storm.spout.SpoutOutputCollector;2 importbacktype.storm.task.TopologyContext;3 importbacktype.storm.topology.OutputFieldsDeclarer;4 importbacktype.storm.topology.base.BaseRichSpout;5 importbacktype.storm.tuple.Fields;6 importbacktype.storm.tuple.Values;7 importbacktype.storm.utils.Utils;8
9 importjava.util.Map;10 importjava.util.Random;11
12 public class RandomSentenceSpout extendsBaseRichSpout {13 SpoutOutputCollector _collector;14 Random _rand;15
16 @Override17 public voidopen(Map conf, TopologyContext context, SpoutOutputCollector collector) {18 _collector =collector;19 _rand = newRandom();20 }21
22 @Override23 public voidnextTuple() {24 Utils.sleep(10000);25 String[] sentences = new String[]{ "the cow jumped over the moon", "an apple a day keeps the doctor away",26 "four score and seven years ago", "snow white and the seven dwarfs", "i am at two with nature"};27 String sentence =sentences[_rand.nextInt(sentences.length)];28 Object id = newObject();29 System.out.println(id);30 //id message ID 用来保证可靠性的,如果失败fail 会返回 message id 信息
31 _collector.emit(newValues(sentence), id);32 }33
34 @Override35 public voidack(Object id) {36 System.out.println("storm spout ack id = "+id);37 }38
39 @Override40 public voidfail(Object id) {41 }42
43 @Override44 public voiddeclareOutputFields(OutputFieldsDeclarer declarer) {45 declarer.declare(new Fields("word"));46 }47
48 }
4.本地运行
在idea中直接点击运行,观察运行过程
5.集群运行
将程序打包成jar,然后放到集群中运行。
把jar包放到storm/test目录下,执行:
bin/storm jar test/storm-sample.jar com.bigdata.storm.MyTest WordCount