Retrieving TridentWordCount Results from a Storm Cluster

A topology running on a Storm cluster computes continuously and, unlike a Hadoop job, does not leave its results on HDFS: the program itself must write its output somewhere the user specifies, such as a database or a local file. TridentWordCount instead exposes its Trident state through a DRPCStream, so the count of any given word can be queried on demand. However, the storm-starter version only includes local-mode code that queries through a LocalDRPC instance; once the topology is submitted to a real cluster it keeps computing but produces no visible output. The program is therefore modified as follows, so that after submission it starts a DRPCClient to fetch the results:

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package storm.starter.trident;

import backtype.storm.Config;
import backtype.storm.LocalCluster;
import backtype.storm.LocalDRPC;
import backtype.storm.StormSubmitter;
import backtype.storm.generated.StormTopology;
import backtype.storm.tuple.Fields;
import backtype.storm.tuple.Values;
import backtype.storm.utils.DRPCClient; // client used to query the DRPC server
import storm.trident.TridentState;
import storm.trident.TridentTopology;
import storm.trident.operation.BaseFunction;
import storm.trident.operation.TridentCollector;
import storm.trident.operation.builtin.Count;
import storm.trident.operation.builtin.FilterNull;
import storm.trident.operation.builtin.MapGet;
import storm.trident.operation.builtin.Sum;
import storm.trident.testing.FixedBatchSpout;
import storm.trident.testing.MemoryMapState;
import storm.trident.tuple.TridentTuple;


public class TridentWordCount {
  public static class Split extends BaseFunction {
    @Override
    public void execute(TridentTuple tuple, TridentCollector collector) {
      String sentence = tuple.getString(0);
      for (String word : sentence.split(" ")) {
        collector.emit(new Values(word));
      }
    }
  }

  public static StormTopology buildTopology(DRPCClient drpc) { // parameter changed from LocalDRPC to DRPCClient
    FixedBatchSpout spout = new FixedBatchSpout(new Fields("sentence"), 3, new Values("the cow jumped over the moon"),
        new Values("the man went to the store and bought some candy"), new Values("four score and seven years ago"),
        new Values("how many apples can you eat"), new Values("to be or not to be the person"));
    spout.setCycle(true);

    TridentTopology topology = new TridentTopology();
    TridentState wordCounts = topology.newStream("spout1", spout).parallelismHint(16).each(new Fields("sentence"),
        new Split(), new Fields("word")).groupBy(new Fields("word")).persistentAggregate(new MemoryMapState.Factory(),
        new Count(), new Fields("count")).parallelismHint(16);

    topology.newDRPCStream("words").each(new Fields("args"), new Split(), new Fields("word")).groupBy(new Fields(
        "word")).stateQuery(wordCounts, new Fields("word"), new MapGet(), new Fields("count")).each(new Fields("count"),
        new FilterNull()).aggregate(new Fields("count"), new Sum(), new Fields("sum"));
    return topology.build();
  }

  public static void main(String[] args) throws Exception {
    Config conf = new Config();
    conf.setMaxSpoutPending(20);
//    conf.setDebug(true); // log spout and bolt activity
/*    if (args.length == 0) {
      LocalDRPC drpc = new LocalDRPC();
      LocalCluster cluster = new LocalCluster();
      cluster.submitTopology("wordCounter", conf, buildTopology(drpc));
      for (int i = 0; i < 100; i++) {
        System.out.println("DRPC RESULT: " + drpc.execute("words", "jumped"));
        Thread.sleep(1000);
      }
    }
    else {*/
      conf.setNumWorkers(3); // LocalDRPC and DRPCClient are created differently, so local mode is dropped and cluster mode is assumed
      DRPCClient client = new DRPCClient("drpc.server.location", 3772); // replace with your DRPC server host; 3772 is the default DRPC port
      StormSubmitter.submitTopologyWithProgressBar(args[0], conf, buildTopology(client));
      
      while (true) { // repeatedly print the combined counts of "jumped" and "the"
        System.out.println(client.execute("words", "jumped the"));
        Thread.sleep(1000);
      }
    // }
  }
}
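Before the DRPCClient can connect, the cluster needs a running DRPC server that is declared in storm.yaml. A minimal sketch of the required configuration, assuming the DRPC server runs on the host drpc.server.location (replace it with your actual hostname, the same one passed to the DRPCClient constructor above):

# storm.yaml on every node; 3772 is the default drpc.port
drpc.servers:
  - "drpc.server.location"

Start the DRPC daemon on that host with the "storm drpc" command before submitting the topology; otherwise every client.execute() call will fail to connect.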


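To try the modified program on a cluster, package it and submit it with the storm jar command, passing the topology name as the first argument (it becomes args[0] above). A sketch, assuming the storm-starter project was built into a jar with dependencies (adjust the jar name to match your build):

storm jar storm-starter-with-dependencies.jar storm.starter.trident.TridentWordCount wordCounter

Because the spout cycles through the same five sentences forever, the counts keep growing, so each client.execute("words", "jumped the") call returns an ever-increasing sum, printed as a JSON-style result such as [[42]].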