Package plan_runner.components

Source Code of plan_runner.components.DataSourceComponent

package plan_runner.components;

import java.util.ArrayList;
import java.util.List;

import org.apache.log4j.Logger;

import plan_runner.conversion.TypeConversion;
import plan_runner.expressions.ValueExpression;
import plan_runner.operators.ChainOperator;
import plan_runner.operators.Operator;
import plan_runner.predicates.Predicate;
import plan_runner.query_plans.QueryPlan;
import plan_runner.storm_components.InterchangingComponent;
import plan_runner.storm_components.StormComponent;
import plan_runner.storm_components.StormDataSource;
import plan_runner.storm_components.synchronization.TopologyKiller;
import plan_runner.utilities.MyUtilities;
import plan_runner.utilities.SystemParameters;
import backtype.storm.Config;
import backtype.storm.topology.TopologyBuilder;

public class DataSourceComponent implements Component {
  private static final long serialVersionUID = 1L;
  private static Logger LOG = Logger.getLogger(DataSourceComponent.class);

  private final String _componentName;
  private final String _inputPath;

  private long _batchOutputMillis;

  private List<Integer> _hashIndexes;
  private List<ValueExpression> _hashExpressions;

  private StormDataSource _dataSource;

  private final ChainOperator _chain = new ChainOperator();

  private boolean _printOut;
  private boolean _printOutSet; // whether printOut condition is already set

  private Component _child;

  public DataSourceComponent(String componentName, String inputPath, QueryPlan queryPlan) {
    _componentName = componentName;
    _inputPath = inputPath;

    queryPlan.add(this);
  }

  @Override
  public DataSourceComponent addOperator(Operator operator) {
    _chain.addOperator(operator);
    return this;
  }

  @Override
  public boolean equals(Object obj) {
    if (obj instanceof Component)
      return _componentName.equals(((Component) obj).getName());
    else
      return false;
  }

  @Override
  public List<DataSourceComponent> getAncestorDataSources() {
    final List<DataSourceComponent> list = new ArrayList<DataSourceComponent>();
    list.add(this);
    return list;
  }

  @Override
  public long getBatchOutputMillis() {
    return _batchOutputMillis;
  }

  @Override
  public ChainOperator getChainOperator() {
    return _chain;
  }

  @Override
  public Component getChild() {
    return _child;
  }

  // from StormEmitter interface
  @Override
  public String[] getEmitterIDs() {
    return _dataSource.getEmitterIDs();
  }

  @Override
  public List<String> getFullHashList() {
    throw new RuntimeException("This method should not be invoked for DataSourceComponent!");
  }

  @Override
  public List<ValueExpression> getHashExpressions() {
    return _hashExpressions;
  }

  @Override
  public List<Integer> getHashIndexes() {
    return _hashIndexes;
  }

  @Override
  public String getInfoID() {
    return _dataSource.getInfoID() + "\n";
  }

  @Override
  public String getName() {
    return _componentName;
  }

  @Override
  public Component[] getParents() {
    return null;
  }

  @Override
  public boolean getPrintOut() {
    return _printOut;
  }

  @Override
  public int hashCode() {
    int hash = 3;
    hash = 59 * hash + (_componentName != null ? _componentName.hashCode() : 0);
    return hash;
  }

  @Override
  public void makeBolts(TopologyBuilder builder, TopologyKiller killer,
      List<String> allCompNames, Config conf, int partitioningType, int hierarchyPosition) {

    // by default print out for the last component
    // for other conditions, can be set via setPrintOut
    if (hierarchyPosition == StormComponent.FINAL_COMPONENT && !_printOutSet)
      setPrintOut(true);

    final int parallelism = SystemParameters.getInt(conf, _componentName + "_PAR");
    if (parallelism > 1 && _chain.getDistinct() != null)
      throw new RuntimeException(
          _componentName
              + ": Distinct operator cannot be specified for multiple spouts for one input file!");

    MyUtilities.checkBatchOutput(_batchOutputMillis, _chain.getAggregation(), conf);

    _dataSource = new StormDataSource(this, allCompNames, _inputPath, hierarchyPosition,
        parallelism, builder, killer, conf);
  }

  @Override
  public DataSourceComponent setBatchOutputMillis(long millis) {
    throw new RuntimeException("Setting batch mode is not allowed for DataSourceComponents!");
    // _batchOutputMillis = millis;
    // return this;
  }

  @Override
  public void setChild(Component child) {
    _child = child;
  }

  @Override
  public DataSourceComponent setFullHashList(List<String> fullHashList) {
    throw new RuntimeException("This method should not be invoked for DataSourceComponent!");
  }

  @Override
  public DataSourceComponent setHashExpressions(List<ValueExpression> hashExpressions) {
    _hashExpressions = hashExpressions;
    return this;
  }

  @Override
  public DataSourceComponent setHashIndexes(List<Integer> hashIndexes) {
    _hashIndexes = hashIndexes;
    return this;
  }

  @Override
  public DataSourceComponent setPrintOut(boolean printOut) {
    _printOutSet = true;
    _printOut = printOut;
    return this;
  }

  @Override
  public Component setInterComp(InterchangingComponent inter) {
    throw new RuntimeException("Datasource component does not support setInterComp");
  }

  @Override
  public Component setJoinPredicate(Predicate joinPredicate) {
    throw new RuntimeException("Datasource component does not support Join Predicates");
  }

  @Override
  public Component setContentSensitiveThetaJoinWrapper(TypeConversion wrapper) {
    return this;
  }

}
TOP

Related Classes of plan_runner.components.DataSourceComponent

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.