-
Notifications
You must be signed in to change notification settings - Fork 12
/
Copy pathWordCountTopology.java
124 lines (101 loc) · 3.43 KB
/
WordCountTopology.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
package storm.starter;
import java.util.Arrays;
import java.util.HashMap;
import java.util.Map;
import java.util.Random;
import backtype.storm.Config;
import backtype.storm.LocalCluster;
import backtype.storm.StormSubmitter;
import backtype.storm.spout.SpoutOutputCollector;
import backtype.storm.task.OutputCollector;
import backtype.storm.task.TopologyContext;
import backtype.storm.topology.OutputFieldsDeclarer;
import backtype.storm.topology.TopologyBuilder;
import backtype.storm.topology.base.BaseRichBolt;
import backtype.storm.topology.base.BaseRichSpout;
import backtype.storm.tuple.Fields;
import backtype.storm.tuple.Tuple;
import backtype.storm.tuple.Values;
import backtype.storm.utils.Utils;
/**
 * This topology demonstrates Storm's stream groupings: a spout emits random words and a fields
 * grouping on "word" connects it to a bolt that counts the words it receives.
 */
public class WordCountTopology {
/** Private and empty: code outside this class cannot create instances of it. */
private WordCountTopology() { }
/**
 * Spout that emits one word per {@code nextTuple} call, picked pseudo-randomly from a fixed list.
 */
static class WordSpout extends BaseRichSpout {
  /** Candidate words; exactly one of them is emitted on every {@code nextTuple} call. */
  private static final String[] WORDS = {"Jack", "Mary", "Jill", "McDonald"};

  private SpoutOutputCollector collector;
  private Random rnd;

  /**
   * Remembers the collector used for emitting and creates the random generator.
   *
   * <p>The generator is seeded with the constant 31, so the sequence of picks is the same on
   * every run.
   *
   * @param map not used by this spout
   * @param topologyContext not used by this spout
   * @param spoutOutputCollector collector that {@code nextTuple} emits through
   */
  @Override
  public void open(Map map, TopologyContext topologyContext,
      SpoutOutputCollector spoutOutputCollector) {
    collector = spoutOutputCollector;
    rnd = new Random(31);
  }

  /** Pauses via {@code Utils.sleep(10)}, then emits a one-value tuple holding a random word. */
  @Override
  public void nextTuple() {
    Utils.sleep(10);
    String word = WORDS[rnd.nextInt(WORDS.length)];
    collector.emit(new Values(word));
  }

  /** Declares the single output field, {@code "word"}. */
  @Override
  public void declareOutputFields(OutputFieldsDeclarer outputFieldsDeclarer) {
    outputFieldsDeclarer.declare(new Fields("word"));
  }
}
/**
 * A bolt that counts the words that it receives.
 *
 * <p>Counts live in a map held by this bolt instance. After every {@code REPORT_INTERVAL}
 * tuples the whole map is printed to standard output, prefixed with a name built from the
 * component id and task id. Every tuple is acked; nothing is emitted downstream.
 */
static class ConsumerBolt extends BaseRichBolt {
  /** Number of tuples processed between two printed reports. */
  private static final int REPORT_INTERVAL = 200;

  private OutputCollector collector;
  private Map<String, Integer> countMap;
  private int tupleCount;
  private String taskName;

  /**
   * Resets the counting state and records the collector and a printable task name.
   *
   * @param map not used by this bolt
   * @param topologyContext source of the component id and task id used in the report prefix
   * @param outputCollector collector used to ack incoming tuples
   */
  @Override
  public void prepare(Map map, TopologyContext topologyContext, OutputCollector outputCollector) {
    collector = outputCollector;
    countMap = new HashMap<String, Integer>();
    tupleCount = 0;
    taskName = topologyContext.getThisComponentId() + "_" + topologyContext.getThisTaskId();
  }

  /**
   * Increments the count for the word in field 0 of the tuple, prints a report when the
   * reporting interval is reached, and acks the tuple.
   *
   * @param tuple incoming tuple; its first field is read as the word
   */
  @Override
  public void execute(Tuple tuple) {
    String key = tuple.getString(0);

    // One lookup is enough: an absent key starts at 1, a present one is incremented.
    Integer previous = countMap.get(key);
    countMap.put(key, previous == null ? 1 : previous + 1);

    // Count first, report second, so the printed snapshot includes the current tuple and the
    // totals in each report add up to a multiple of REPORT_INTERVAL.
    tupleCount += 1;
    if (tupleCount >= REPORT_INTERVAL) {
      tupleCount = 0;
      System.out.println(taskName + ":" + Arrays.toString(countMap.entrySet().toArray()));
    }

    collector.ack(tuple);
  }

  /** Declares no output fields: this bolt never emits tuples. */
  @Override
  public void declareOutputFields(OutputFieldsDeclarer outputFieldsDeclarer) {
  }
}
/**
 * Builds the word-count topology and runs it.
 *
 * <p>The topology wires a {@code WordSpout} (component id "word") to a {@code ConsumerBolt}
 * (component id "count") through a fields grouping on the "word" field.
 *
 * <p>With at least one argument, the topology is submitted through {@code StormSubmitter}
 * under the name {@code args[0]}. Without arguments it is run in a {@code LocalCluster} under
 * the name "word-count" for 10 seconds, after which the local cluster is shut down.
 *
 * @param args optional; {@code args[0]} is the topology name used for submission
 * @throws Exception if submission fails or the local run is interrupted
 */
public static void main(String[] args) throws Exception {
  TopologyBuilder builder = new TopologyBuilder();
  builder.setSpout("word", new WordSpout(), 2);
  builder.setBolt("count", new ConsumerBolt(), 3).fieldsGrouping("word", new Fields("word"));

  Config conf = new Config();
  conf.setDebug(true);

  if (args != null && args.length > 0) {
    conf.setNumWorkers(3);
    StormSubmitter.submitTopology(args[0], conf, builder.createTopology());
  } else {
    conf.setMaxTaskParallelism(3);
    LocalCluster cluster = new LocalCluster();
    try {
      cluster.submitTopology("word-count", conf, builder.createTopology());
      Thread.sleep(10000);
    } finally {
      // Always release the local cluster, even if submission fails or the sleep is interrupted.
      cluster.shutdown();
    }
  }
}
}