Impala
Impala is the open source, native analytic database for Apache Hadoop.
PipelinedPlanNodeSet.java
// Copyright 2012 Cloudera Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

package com.cloudera.impala.planner;

import java.util.ArrayList;
import java.util.List;
import java.util.Set;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import com.cloudera.impala.thrift.TQueryOptions;
import com.google.common.base.Preconditions;
import com.google.common.collect.Lists;
import com.google.common.collect.Sets;

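/**
 * Represents a set of PlanNodes and DataSinks that execute and consume resources
 * concurrently. Nodes and sinks in such a set may belong to different plan fragments
 * because data is streamed across fragment boundaries during execution.
 */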
public class PipelinedPlanNodeSet {
  private final static Logger LOG = LoggerFactory.getLogger(PipelinedPlanNodeSet.class);

  // Minimum per-host resource requirements to ensure that no plan node set can have
  // estimates of zero, even if the contained PlanNodes have estimates of zero.
  public static final long MIN_PER_HOST_MEM = 10 * 1024 * 1024;
  public static final int MIN_PER_HOST_VCORES = 1;

  // List of plan nodes that execute and consume resources concurrently.
  private final ArrayList<PlanNode> planNodes = Lists.newArrayList();

  // DataSinks that execute and consume resources concurrently.
  // Primarily used for estimating the cost of insert queries.
  private final List<DataSink> dataSinks = Lists.newArrayList();

  // Estimated per-host memory and CPU requirements.
  // Valid after computeResourceEstimates().
  private long perHostMem = MIN_PER_HOST_MEM;
  private int perHostVcores = MIN_PER_HOST_VCORES;

  public void add(PlanNode node) {
    Preconditions.checkNotNull(node.getFragment());
    planNodes.add(node);
  }

  public void addSink(DataSink sink) {
    Preconditions.checkNotNull(sink);
    dataSinks.add(sink);
  }

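  /**
   * Computes the estimated per-host memory and CPU (vcore) requirements of this plan
   * node set, optionally excluding unpartitioned fragments. Returns true if valid
   * estimates were computed and stored, and false otherwise.
   */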
  public boolean computeResourceEstimates(boolean excludeUnpartitionedFragments,
      TQueryOptions queryOptions) {
    Set<PlanFragment> uniqueFragments = Sets.newHashSet();

    // Distinguish the per-host memory estimates for scan nodes and non-scan nodes to
    // get a tighter estimate on the amount of memory required by multiple concurrent
    // scans. The memory required by all concurrent scans of the same type (Hdfs/Hbase)
    // cannot exceed the per-host upper memory bound for that scan type. Intuitively,
    // the amount of I/O buffers is limited by the disk bandwidth.
    long perHostHbaseScanMem = 0L;
    long perHostHdfsScanMem = 0L;
    long perHostNonScanMem = 0L;

    for (int i = 0; i < planNodes.size(); ++i) {
      PlanNode node = planNodes.get(i);
      PlanFragment fragment = node.getFragment();
      if (!fragment.isPartitioned() && excludeUnpartitionedFragments) continue;
      node.computeCosts(queryOptions);
      uniqueFragments.add(fragment);
      if (node.getPerHostMemCost() < 0) {
        LOG.warn(String.format("Invalid per-host memory requirement %s of node %s.\n" +
            "PlanNode stats are: numNodes_=%s", node.getPerHostMemCost(),
            node.getClass().getSimpleName(), node.getNumNodes()));
      }
      if (node instanceof HBaseScanNode) {
        perHostHbaseScanMem += node.getPerHostMemCost();
      } else if (node instanceof HdfsScanNode) {
        perHostHdfsScanMem += node.getPerHostMemCost();
      } else {
        perHostNonScanMem += node.getPerHostMemCost();
      }
    }

    // The memory required by concurrent scans cannot exceed the upper memory bound
    // for that scan type.
    // TODO: In the future, we may want to restrict scanner concurrency based on a
    // memory limit. This estimation will need to account for that as well.
    perHostHbaseScanMem =
        Math.min(perHostHbaseScanMem, HBaseScanNode.getPerHostMemUpperBound());
    perHostHdfsScanMem =
        Math.min(perHostHdfsScanMem, HdfsScanNode.getPerHostMemUpperBound());

    long perHostDataSinkMem = 0L;
    for (int i = 0; i < dataSinks.size(); ++i) {
      DataSink sink = dataSinks.get(i);
      PlanFragment fragment = sink.getFragment();
      if (!fragment.isPartitioned() && excludeUnpartitionedFragments) continue;
      // Sanity check that this plan-node set has at least one PlanNode of fragment.
      Preconditions.checkState(uniqueFragments.contains(fragment));
      sink.computeCosts();
      if (sink.getPerHostMemCost() < 0) {
        LOG.warn(String.format("Invalid per-host memory requirement %s of sink %s.\n",
            sink.getPerHostMemCost(), sink.getClass().getSimpleName()));
      }
      perHostDataSinkMem += sink.getPerHostMemCost();
    }

    // Combine the memory estimates of all sinks, scan nodes and non-scan nodes.
    long perHostMem = perHostHdfsScanMem + perHostHbaseScanMem + perHostNonScanMem +
        perHostDataSinkMem;

    // The backend needs at least one thread per fragment.
    int perHostVcores = uniqueFragments.size();

    // This plan node set might only have unpartitioned fragments.
    // Only set estimates if they are valid.
    if (perHostMem >= 0 && perHostVcores >= 0) {
      this.perHostMem = perHostMem;
      this.perHostVcores = perHostVcores;
      return true;
    }
    return false;
  }

  public long getPerHostMem() { return perHostMem; }
  public int getPerHostVcores() { return perHostVcores; }

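  /**
   * Computes and returns the pipelined plan node sets of the plan tree rooted at
   * 'root'.
   */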
  public static ArrayList<PipelinedPlanNodeSet> computePlanNodeSets(PlanNode root) {
    ArrayList<PipelinedPlanNodeSet> planNodeSets =
        Lists.newArrayList(new PipelinedPlanNodeSet());
    computePlanNodeSets(root, planNodeSets.get(0), null, planNodeSets);
    return planNodeSets;
  }

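  /**
   * Recursively traverses the plan tree rooted at 'node' and populates 'planNodeSets'
   * with the sets of concurrently executing nodes. 'lhsSet' is the set the current
   * node is added to; 'rhsSet' collects the build sides (right-hand children) of
   * enclosing hash joins and may be null if there is none.
   */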
  private static void computePlanNodeSets(PlanNode node, PipelinedPlanNodeSet lhsSet,
      PipelinedPlanNodeSet rhsSet, ArrayList<PipelinedPlanNodeSet> planNodeSets) {
    lhsSet.add(node);
    if (node == node.getFragment().getPlanRoot() && node.getFragment().hasSink()) {
      lhsSet.addSink(node.getFragment().getSink());
    }

    if (node instanceof HashJoinNode) {
      // Create a new set for the right-hand sides of joins if necessary.
      if (rhsSet == null) {
        rhsSet = new PipelinedPlanNodeSet();
        planNodeSets.add(rhsSet);
      }
      // The join node itself is added to the lhsSet (above) and the rhsSet.
      rhsSet.add(node);
      computePlanNodeSets(node.getChild(1), rhsSet, null, planNodeSets);
      computePlanNodeSets(node.getChild(0), lhsSet, rhsSet, planNodeSets);
      return;
    }

    if (node.isBlockingNode()) {
      // We add blocking nodes to two plan node sets because they require resources
      // while consuming their input (execution of the preceding set) and while they
      // emit their output (execution of the following set).
      lhsSet = new PipelinedPlanNodeSet();
      lhsSet.add(node);
      planNodeSets.add(lhsSet);
      // Join builds under this blocking node belong in a new rhsSet.
      rhsSet = null;
    }

    // Assume that non-join, non-blocking nodes with multiple children
    // (e.g., ExchangeNodes) consume their inputs in an arbitrary order,
    // i.e., all child subtrees execute concurrently.
    // TODO: This is not true for UnionNodes anymore. Fix the estimates accordingly.
    for (PlanNode child: node.getChildren()) {
      computePlanNodeSets(child, lhsSet, rhsSet, planNodeSets);
    }
  }
}
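A minimal caller sketch of how these pieces fit together (hypothetical: 'root', 'queryOptions', and 'excludeUnpartitioned' are assumed to be supplied by the surrounding planner code and are not part of this file). Since each set models nodes that run concurrently, one plausible way to combine the per-set estimates is to take the maximum across all sets as the per-host requirement:

  // Hypothetical usage; 'root', 'queryOptions', and 'excludeUnpartitioned'
  // are assumptions, not part of this file.
  ArrayList<PipelinedPlanNodeSet> sets = PipelinedPlanNodeSet.computePlanNodeSets(root);
  long perHostMem = PipelinedPlanNodeSet.MIN_PER_HOST_MEM;
  int perHostVcores = PipelinedPlanNodeSet.MIN_PER_HOST_VCORES;
  for (PipelinedPlanNodeSet set : sets) {
    // Skip sets with invalid estimates (e.g., only unpartitioned fragments).
    if (!set.computeResourceEstimates(excludeUnpartitioned, queryOptions)) continue;
    perHostMem = Math.max(perHostMem, set.getPerHostMem());
    perHostVcores = Math.max(perHostVcores, set.getPerHostVcores());
  }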