Impala
Impala is the open source, native analytic database for Apache Hadoop.
partitioned-aggregation-node.cc
1 // Copyright 2012 Cloudera Inc.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 // http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
16 
17 #include <math.h>
18 #include <sstream>
19 #include <gutil/strings/substitute.h>
20 #include <thrift/protocol/TDebugProtocol.h>
21 
22 #include "codegen/codegen-anyval.h"
23 #include "codegen/llvm-codegen.h"
24 #include "exec/hash-table.inline.h"
25 #include "exprs/agg-fn-evaluator.h"
26 #include "exprs/expr.h"
27 #include "exprs/expr-context.h"
28 #include "exprs/slot-ref.h"
30 #include "runtime/descriptors.h"
31 #include "runtime/mem-pool.h"
32 #include "runtime/raw-value.h"
33 #include "runtime/row-batch.h"
34 #include "runtime/runtime-state.h"
36 #include "runtime/tuple.h"
37 #include "runtime/tuple-row.h"
38 #include "udf/udf-internal.h"
39 #include "util/debug-util.h"
40 #include "util/runtime-profile.h"
41 
42 #include "gen-cpp/Exprs_types.h"
43 #include "gen-cpp/PlanNodes_types.h"
44 
45 #include "common/names.h"
46 
47 using namespace impala;
48 using namespace llvm;
49 using namespace strings;
50 
51 namespace impala {
52 
53 const char* PartitionedAggregationNode::LLVM_CLASS_NAME =
54  "class.impala::PartitionedAggregationNode";
55 
56 PartitionedAggregationNode::PartitionedAggregationNode(
57  ObjectPool* pool, const TPlanNode& tnode, const DescriptorTbl& descs)
58  : ExecNode(pool, tnode, descs),
59  intermediate_tuple_id_(tnode.agg_node.intermediate_tuple_id),
60  intermediate_tuple_desc_(NULL),
61  output_tuple_id_(tnode.agg_node.output_tuple_id),
62  output_tuple_desc_(NULL),
63  needs_finalize_(tnode.agg_node.need_finalize),
64  needs_serialize_(false),
65  block_mgr_client_(NULL),
66  using_small_buffers_(true),
67  singleton_output_tuple_(NULL),
68  singleton_output_tuple_returned_(true),
69  output_partition_(NULL),
70  process_row_batch_fn_(NULL),
71  build_timer_(NULL),
72  ht_resize_timer_(NULL),
73  get_results_timer_(NULL),
74  num_hash_buckets_(NULL),
75  partitions_created_(NULL),
76  max_partition_level_(NULL),
77  num_row_repartitioned_(NULL),
78  num_repartitions_(NULL) {
79  DCHECK_EQ(PARTITION_FANOUT, 1 << NUM_PARTITIONING_BITS);
80 }
81 
82 Status PartitionedAggregationNode::Init(const TPlanNode& tnode) {
83  RETURN_IF_ERROR(ExecNode::Init(tnode));
84  RETURN_IF_ERROR(
85  Expr::CreateExprTrees(pool_, tnode.agg_node.grouping_exprs, &probe_expr_ctxs_));
86  for (int i = 0; i < tnode.agg_node.aggregate_functions.size(); ++i) {
87  AggFnEvaluator* evaluator;
88  RETURN_IF_ERROR(AggFnEvaluator::Create(
89  pool_, tnode.agg_node.aggregate_functions[i], &evaluator));
90  aggregate_evaluators_.push_back(evaluator);
91  }
92  return Status::OK;
93 }
94 
95 Status PartitionedAggregationNode::Prepare(RuntimeState* state) {
96  SCOPED_TIMER(runtime_profile_->total_time_counter());
97 
98  // Create the codegen object before preparing conjunct_ctxs_ and children_, so that any
99  // ScalarFnCalls will use codegen.
100  // TODO: this is brittle and hard to reason about, revisit
101  if (state->codegen_enabled()) {
102  LlvmCodeGen* codegen;
103  RETURN_IF_ERROR(state->GetCodegen(&codegen));
104  }
105 
107  state_ = state;
108 
109  mem_pool_.reset(new MemPool(mem_tracker()));
110  agg_fn_pool_.reset(new MemPool(expr_mem_tracker()));
111 
112  build_timer_ = ADD_TIMER(runtime_profile(), "BuildTime");
113  ht_resize_timer_ = ADD_TIMER(runtime_profile(), "HTResizeTime");
114  get_results_timer_ = ADD_TIMER(runtime_profile(), "GetResultsTime");
116  ADD_COUNTER(runtime_profile(), "HashBuckets", TUnit::UNIT);
118  ADD_COUNTER(runtime_profile(), "PartitionsCreated", TUnit::UNIT);
120  "MaxPartitionLevel", TUnit::UNIT);
122  ADD_COUNTER(runtime_profile(), "RowsRepartitioned", TUnit::UNIT);
124  ADD_COUNTER(runtime_profile(), "NumRepartitions", TUnit::UNIT);
126  ADD_COUNTER(runtime_profile(), "SpilledPartitions", TUnit::UNIT);
128  "LargestPartitionPercent", TUnit::UNIT);
129 
133  DCHECK_EQ(intermediate_tuple_desc_->slots().size(),
134  output_tuple_desc_->slots().size());
135 
139 
141 
142  // Construct build exprs from intermediate_tuple_desc_
143  for (int i = 0; i < probe_expr_ctxs_.size(); ++i) {
145  DCHECK(desc->type().type == TYPE_NULL ||
146  desc->type() == probe_expr_ctxs_[i]->root()->type());
147  // Hack to avoid TYPE_NULL SlotRefs.
148  Expr* expr = desc->type().type != TYPE_NULL ?
149  new SlotRef(desc) : new SlotRef(desc, TYPE_BOOLEAN);
150  state->obj_pool()->Add(expr);
151  build_expr_ctxs_.push_back(new ExprContext(expr));
152  state->obj_pool()->Add(build_expr_ctxs_.back());
153  contains_var_len_grouping_exprs_ |= expr->type().IsVarLen();
154  }
155  // Construct a new row desc for preparing the build exprs because neither the child's
156  // nor this node's output row desc may contain the intermediate tuple, e.g.,
157  // in a single-node plan with an intermediate tuple different from the output tuple.
162 
163  int j = probe_expr_ctxs_.size();
164  for (int i = 0; i < aggregate_evaluators_.size(); ++i, ++j) {
165  // skip non-materialized slots; we don't have evaluators instantiated for those
166  while (!intermediate_tuple_desc_->slots()[j]->is_materialized()) {
167  DCHECK_LT(j, intermediate_tuple_desc_->slots().size() - 1)
168  << "#eval= " << aggregate_evaluators_.size()
169  << " #probe=" << probe_expr_ctxs_.size();
170  ++j;
171  }
172  SlotDescriptor* intermediate_slot_desc = intermediate_tuple_desc_->slots()[j];
173  SlotDescriptor* output_slot_desc = output_tuple_desc_->slots()[j];
174  FunctionContext* agg_fn_ctx = NULL;
176  intermediate_slot_desc, output_slot_desc, agg_fn_pool_.get(), &agg_fn_ctx));
177  agg_fn_ctxs_.push_back(agg_fn_ctx);
178  state->obj_pool()->Add(agg_fn_ctx);
179  needs_serialize_ |= aggregate_evaluators_[i]->SupportsSerialize();
180  }
181 
182  if (probe_expr_ctxs_.empty()) {
183  // create single output tuple now; we need to output something
184  // even if our input is empty
188  } else {
189  ht_ctx_.reset(new HashTableCtx(build_expr_ctxs_, probe_expr_ctxs_, true, true,
194  }
195 
196  if (state->codegen_enabled()) {
197  LlvmCodeGen* codegen;
198  RETURN_IF_ERROR(state->GetCodegen(&codegen));
199  Function* codegen_process_row_batch_fn = CodegenProcessBatch();
200  if (codegen_process_row_batch_fn != NULL) {
201  codegen->AddFunctionToJit(codegen_process_row_batch_fn,
202  reinterpret_cast<void**>(&process_row_batch_fn_));
203  AddRuntimeExecOption("Codegen Enabled");
204  }
205  }
206  return Status::OK;
207 }
208 
209 Status PartitionedAggregationNode::Open(RuntimeState* state) {
210  SCOPED_TIMER(runtime_profile_->total_time_counter());
212 
215 
216  DCHECK_EQ(aggregate_evaluators_.size(), agg_fn_ctxs_.size());
217  for (int i = 0; i < aggregate_evaluators_.size(); ++i) {
219  }
220 
221  if (needs_serialize_ && block_mgr_client_ != NULL) {
223  state->block_mgr(), block_mgr_client_,
224  false, /* use initial small buffers */
225  true /* delete on read */));
227  DCHECK(serialize_stream_->has_write_block());
228  }
229 
230  // Read all the rows from the child and process them.
231  RETURN_IF_ERROR(children_[0]->Open(state));
232  RowBatch batch(children_[0]->row_desc(), state->batch_size(), mem_tracker());
233  bool eos = false;
234  while (!eos) {
235  RETURN_IF_CANCELLED(state);
237  RETURN_IF_ERROR(children_[0]->GetNext(state, &batch, &eos));
238 
239  if (VLOG_ROW_IS_ON) {
240  for (int i = 0; i < batch.num_rows(); ++i) {
241  TupleRow* row = batch.GetRow(i);
242  VLOG_ROW << "input row: " << PrintRow(row, children_[0]->row_desc());
243  }
244  }
245 
247  if (process_row_batch_fn_ != NULL) {
248  RETURN_IF_ERROR(process_row_batch_fn_(this, &batch, ht_ctx_.get()));
249  } else if (probe_expr_ctxs_.empty()) {
251  } else {
252  // There is grouping, so we will do partitioned aggregation.
253  RETURN_IF_ERROR(ProcessBatch<false>(&batch, ht_ctx_.get()));
254  }
255  batch.Reset();
256  }
257 
258  // We have consumed all of the input from the child and transferred ownership of the
259  // resources we need, so the child can be closed safely to release its resources.
260  child(0)->Close(state);
261 
262  // Done consuming child(0)'s input. Move all the partitions in hash_partitions_
263  // to spilled_partitions_/aggregated_partitions_. We'll finish the processing in
264  // GetNext().
265  if (!probe_expr_ctxs_.empty()) {
267  }
268  return Status::OK;
269 }
270 
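// GetNext() has two paths: with no grouping exprs it returns the single
// pre-aggregated tuple; otherwise it streams results out of the current output
// partition's hash table, moving to the next partition (repartitioning spilled
// ones as needed) once each is exhausted.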
271 Status PartitionedAggregationNode::GetNext(RuntimeState* state,
272  RowBatch* row_batch, bool* eos) {
273  SCOPED_TIMER(runtime_profile_->total_time_counter());
274  RETURN_IF_ERROR(ExecDebugAction(TExecNodePhase::GETNEXT, state));
275  RETURN_IF_CANCELLED(state);
277 
278  if (ReachedLimit()) {
279  *eos = true;
280  return Status::OK;
281  }
282 
283  ExprContext** ctxs = &conjunct_ctxs_[0];
284  int num_ctxs = conjunct_ctxs_.size();
285  if (probe_expr_ctxs_.empty()) {
286  // There was no grouping, so evaluate the conjuncts and return the single result row.
287  // We allow calling GetNext() after eos, so don't return this row again.
289  int row_idx = row_batch->AddRow();
290  TupleRow* row = row_batch->GetRow(row_idx);
291  Tuple* output_tuple = GetOutputTuple(
293  row->SetTuple(0, output_tuple);
294  if (ExecNode::EvalConjuncts(ctxs, num_ctxs, row)) {
295  row_batch->CommitLastRow();
297  }
299  }
300  *eos = true;
302  return Status::OK;
303  }
304 
305  if (output_iterator_.AtEnd()) {
306  // Done with this partition, move onto the next one.
307  if (output_partition_ != NULL) {
308  output_partition_->Close(false);
309  output_partition_ = NULL;
310  }
311  if (aggregated_partitions_.empty() && spilled_partitions_.empty()) {
312  // No more partitions, all done.
313  *eos = true;
314  return Status::OK;
315  }
316  // Process next partition.
318  DCHECK(output_partition_ != NULL);
319  }
320 
322  int count = 0;
323  const int N = BitUtil::NextPowerOfTwo(state->batch_size());
324  // Keep returning rows from the current partition.
325  while (!output_iterator_.AtEnd() && !row_batch->AtCapacity()) {
326  // This loop can go on for a long time if the conjuncts are very selective. Do query
327  // maintenance every N iterations.
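// Since N is a power of two, (count & (N - 1)) is equivalent to (count % N),
// so the check below fires once every N iterations.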
328  if ((count++ & (N - 1)) == 0) {
329  RETURN_IF_CANCELLED(state);
331  }
332 
333  int row_idx = row_batch->AddRow();
334  TupleRow* row = row_batch->GetRow(row_idx);
335  Tuple* intermediate_tuple = output_iterator_.GetTuple();
336  Tuple* output_tuple = GetOutputTuple(
337  output_partition_->agg_fn_ctxs, intermediate_tuple, row_batch->tuple_data_pool());
339  row->SetTuple(0, output_tuple);
340  if (ExecNode::EvalConjuncts(ctxs, num_ctxs, row)) {
341  row_batch->CommitLastRow();
343  if (ReachedLimit()) break; // TODO: remove this check? is this expensive?
344  }
345  }
347  *eos = ReachedLimit();
348  if (output_iterator_.AtEnd()) row_batch->MarkNeedToReturn();
349  return Status::OK;
350 }
351 
352 void PartitionedAggregationNode::CleanupHashTbl(const vector<FunctionContext*>& ctxs,
353  HashTable::Iterator it) {
354  if (!needs_finalize_ && !needs_serialize_) return;
355 
356  // Iterate through the remaining rows in the hash table and call Serialize/Finalize on
357  // them in order to free any memory allocated by UDAs. Finalize() requires a dst tuple
358  // but we don't actually need the result, so allocate a single dummy tuple to avoid
359  // accumulating memory.
360  Tuple* dummy_dst = NULL;
361  if (needs_finalize_) {
362  dummy_dst = Tuple::Create(output_tuple_desc_->byte_size(), mem_pool_.get());
363  }
364  while (!it.AtEnd()) {
365  Tuple* tuple = it.GetTuple();
366  if (needs_finalize_) {
368  } else {
370  }
371  it.Next();
372  }
373 }
374 
375 Status PartitionedAggregationNode::Reset(RuntimeState* state) {
376  DCHECK(false) << "NYI";
377  return Status("NYI");
378 }
379 
380 void PartitionedAggregationNode::Close(RuntimeState* state) {
381  if (is_closed()) return;
382 
384  DCHECK_EQ(agg_fn_ctxs_.size(), aggregate_evaluators_.size());
386  }
387 
388  // Iterate through the remaining rows in the hash table and call Serialize/Finalize on
389  // them in order to free any memory allocated by UDAs
390  if (output_partition_ != NULL) {
392  output_partition_->Close(false);
393  }
394 
395  for (int i = 0; i < hash_partitions_.size(); ++i) {
396  hash_partitions_[i]->Close(true);
397  }
398  for (list<Partition*>::iterator it = aggregated_partitions_.begin();
399  it != aggregated_partitions_.end(); ++it) {
400  (*it)->Close(true);
401  }
402  for (list<Partition*>::iterator it = spilled_partitions_.begin();
403  it != spilled_partitions_.end(); ++it) {
404  (*it)->Close(true);
405  }
406  aggregated_partitions_.clear();
407  spilled_partitions_.clear();
408 
409  for (int i = 0; i < aggregate_evaluators_.size(); ++i) {
410  aggregate_evaluators_[i]->Close(state);
411  }
412  for (int i = 0; i < agg_fn_ctxs_.size(); ++i) {
413  agg_fn_ctxs_[i]->impl()->Close();
414  }
415  if (agg_fn_pool_.get() != NULL) agg_fn_pool_->FreeAll();
416  if (mem_pool_.get() != NULL) mem_pool_->FreeAll();
417  if (ht_ctx_.get() != NULL) ht_ctx_->Close();
418  if (serialize_stream_.get() != NULL) serialize_stream_->Close();
419 
420  if (block_mgr_client_ != NULL) {
422  }
423 
426  ExecNode::Close(state);
427 }
428 
429 Status PartitionedAggregationNode::Partition::InitStreams() {
430  agg_fn_pool.reset(new MemPool(parent->expr_mem_tracker()));
431  for (int i = 0; i < parent->agg_fn_ctxs_.size(); ++i) {
432  agg_fn_ctxs.push_back(parent->agg_fn_ctxs_[i]->impl()->Clone(agg_fn_pool.get()));
434  }
435 
439  level == 0, /* use small buffers */
440  false /* delete on read */));
442 
446  level == 0, /* use small buffers */
447  true /* delete on read */));
448  // This stream is only used to spill, no need to ever have this pinned.
450  DCHECK(unaggregated_row_stream->has_write_block());
451  return Status::OK;
452 }
453 
454 bool PartitionedAggregationNode::Partition::InitHashTable() {
455  DCHECK(hash_tbl.get() == NULL);
456  // We use the upper PARTITION_FANOUT num bits to pick the partition so only the
457  // remaining bits can be used for the hash table.
458  // TODO: how many buckets?
459  // TODO: we could switch to 64 bit hashes and then we don't need a max size.
460  // It might be reasonable to limit individual hash table size for other reasons
461  // though. Always start with small buffers.
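// For example, if PARTITION_FANOUT were 16 (NUM_PARTITIONING_BITS == 4), each
// per-partition hash table would be capped at 1 << 28 buckets.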
462  hash_tbl.reset(new HashTable(parent->state_, parent->block_mgr_client_, 1, NULL,
463  1 << (32 - NUM_PARTITIONING_BITS)));
464  return hash_tbl->Init();
465 }
466 
467 Status PartitionedAggregationNode::Partition::Spill(Tuple* intermediate_tuple) {
468  DCHECK(!is_spilled());
469  if (parent->needs_serialize_ && aggregated_row_stream->num_rows() != 0) {
470  // We need to do a lot more work in this case. This step effectively does a merge
471  // aggregation in this node. We need to serialize the intermediates, spill the
472  // intermediates and then feed them into the aggregate function's merge step.
473  // This is typically needed when the intermediate is a string type, meaning the
474  // current in-memory (pre-serialization) layout is not the on-disk block layout.
475  // The disk layout does not support mutable rows, so we need to rewrite the stream
476  // into the on-disk format.
477  // TODO: if it happens to not be a string, we could serialize in place. This is
478  // a future optimization since it is very unlikely to have a serialize phase
479  // for those UDAs.
480  DCHECK_NOTNULL(parent->serialize_stream_.get());
481  DCHECK(!parent->serialize_stream_->is_pinned());
482  DCHECK(parent->serialize_stream_->has_write_block());
483 
484  const vector<AggFnEvaluator*>& evaluators = parent->aggregate_evaluators_;
485 
486  // Serialize and copy the spilled partition's stream into the new stream.
487  bool failed_to_add = false;
488  BufferedTupleStream* new_stream = parent->serialize_stream_.get();
489  HashTable::Iterator it = hash_tbl->Begin(parent->ht_ctx_.get());
490  while (!it.AtEnd()) {
491  Tuple* tuple = it.GetTuple();
492  it.Next();
493  AggFnEvaluator::Serialize(evaluators, agg_fn_ctxs, tuple);
494  if (UNLIKELY(!new_stream->AddRow(reinterpret_cast<TupleRow*>(&tuple)))) {
495  failed_to_add = true;
496  break;
497  }
498  }
499 
500  if (intermediate_tuple != NULL) {
501  AggFnEvaluator::Serialize(evaluators, agg_fn_ctxs, intermediate_tuple);
502  if (!failed_to_add &&
503  !new_stream->AddRow(reinterpret_cast<TupleRow*>(&intermediate_tuple))) {
504  failed_to_add = true;
505  }
506  }
507 
508  // Even if we can't add to new_stream, finish up processing this agg stream
509  // to make clean up easier (someone has to finalize this stream and we don't want
510  // to remember where we are).
511  if (failed_to_add) {
512  parent->CleanupHashTbl(agg_fn_ctxs, it);
513  hash_tbl->Close();
514  hash_tbl.reset();
515  aggregated_row_stream->Close();
516  RETURN_IF_ERROR(new_stream->status());
517  return parent->state_->block_mgr()->MemLimitTooLowError(parent->block_mgr_client_);
518  }
519 
520  aggregated_row_stream->Close();
521  aggregated_row_stream.swap(parent->serialize_stream_);
522  // Recreate serialize_stream_ (and reserve one buffer for it) now, in preparation
523  // for the next time we need to spill. The buffer must be reserved before it is
524  // actually needed, and the reservation must succeed because we just
525  // freed at least one buffer from this partition's (old) aggregated_row_stream.
526  parent->serialize_stream_.reset(new BufferedTupleStream(parent->state_,
527  *parent->intermediate_row_desc_, parent->state_->block_mgr(),
528  parent->block_mgr_client_,
529  false, /* use small buffers */
530  true /* delete on read */));
531  Status s = parent->serialize_stream_->Init(parent->runtime_profile(), false);
532  if (!s.ok()) {
533  hash_tbl->Close();
534  hash_tbl.reset();
535  return s;
536  }
537  DCHECK(parent->serialize_stream_->has_write_block());
538  }
539 
540  // Free the in-memory result data
541  for (int i = 0; i < agg_fn_ctxs.size(); ++i) {
542  agg_fn_ctxs[i]->impl()->Close();
543  }
544 
545  if (agg_fn_pool.get() != NULL) {
546  agg_fn_pool->FreeAll();
547  agg_fn_pool.reset();
548  }
549 
550  hash_tbl->Close();
551  hash_tbl.reset();
552  DCHECK(aggregated_row_stream->has_write_block())
553  << aggregated_row_stream->DebugString();
554  RETURN_IF_ERROR(aggregated_row_stream->UnpinStream(false));
555 
556  COUNTER_ADD(parent->num_spilled_partitions_, 1);
557  if (parent->num_spilled_partitions_->value() == 1) {
558  parent->AddRuntimeExecOption("Spilled");
559  }
560  // Make sure we are not going to lose any information from the small buffers:
561  // check that we are not still using small buffers while rows have already been
562  // added to them.
563  DCHECK(!(aggregated_row_stream->using_small_buffers() &&
564  aggregated_row_stream->num_rows() > 0));
565  DCHECK(!(unaggregated_row_stream->using_small_buffers() &&
566  unaggregated_row_stream->num_rows() > 0));
567  return Status::OK;
568 }
569 
570 void PartitionedAggregationNode::Partition::Close(bool finalize_rows) {
571  if (is_closed) return;
572  is_closed = true;
573  if (aggregated_row_stream.get() != NULL) {
574  if (finalize_rows && hash_tbl.get() != NULL) {
575  // We need to walk all the rows and Finalize them here so the UDA gets a chance
576  // to cleanup. If the hash table is gone (meaning this was spilled), the rows
577  // should have been finalized/serialized in Spill().
578  parent->CleanupHashTbl(agg_fn_ctxs, hash_tbl->Begin(parent->ht_ctx_.get()));
579  }
580  aggregated_row_stream->Close();
581  }
582  if (hash_tbl.get() != NULL) hash_tbl->Close();
583  if (unaggregated_row_stream.get() != NULL) unaggregated_row_stream->Close();
584 
585  for (int i = 0; i < agg_fn_ctxs.size(); ++i) {
586  agg_fn_ctxs[i]->impl()->Close();
587  }
588  if (agg_fn_pool.get() != NULL) agg_fn_pool->FreeAll();
589 }
590 
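// Allocates and initializes the intermediate tuple, either from 'pool' (in-memory
// hash table case) or directly in 'stream' (spilled case). Copies the current
// grouping values from the hash table context and calls Init() on each aggregate
// evaluator, seeding min/max slots so UpdateTuple() can skip NULL checks.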
591 Tuple* PartitionedAggregationNode::ConstructIntermediateTuple(
592  const vector<FunctionContext*>& agg_fn_ctxs, MemPool* pool,
593  BufferedTupleStream* stream) {
594  DCHECK(stream == NULL || pool == NULL);
595  DCHECK(stream != NULL || pool != NULL);
596 
597  Tuple* intermediate_tuple = NULL;
598  uint8_t* buffer = NULL;
599  if (pool != NULL) {
600  intermediate_tuple = Tuple::Create(intermediate_tuple_desc_->byte_size(), pool);
601  } else {
602  // Figure out how large the copied tuple will be. The entire tuple must end
603  // up on a single block in the stream.
604  int size = intermediate_tuple_desc_->byte_size();
606  // TODO: This is likely to be too slow. The hash table could maintain this as
607  // it hashes.
608  for (int i = 0; i < probe_expr_ctxs_.size(); ++i) {
609  if (!probe_expr_ctxs_[i]->root()->type().IsVarLen()) continue;
610  if (ht_ctx_->last_expr_value_null(i)) continue;
611  StringValue* sv = reinterpret_cast<StringValue*>(ht_ctx_->last_expr_value(i));
612  size += sv->len;
613  }
614  }
615  buffer = stream->AllocateRow(size);
616  if (buffer == NULL) return NULL;
617  intermediate_tuple = reinterpret_cast<Tuple*>(buffer);
618  // TODO: remove this. we shouldn't need to zero the entire tuple.
619  intermediate_tuple->Init(size);
620  buffer += intermediate_tuple_desc_->byte_size();
621  }
622 
623  // copy grouping values
624  vector<SlotDescriptor*>::const_iterator slot_desc =
625  intermediate_tuple_desc_->slots().begin();
626  for (int i = 0; i < probe_expr_ctxs_.size(); ++i, ++slot_desc) {
627  if (ht_ctx_->last_expr_value_null(i)) {
628  intermediate_tuple->SetNull((*slot_desc)->null_indicator_offset());
629  } else {
630  void* src = ht_ctx_->last_expr_value(i);
631  void* dst = intermediate_tuple->GetSlot((*slot_desc)->tuple_offset());
632  if (stream == NULL) {
633  RawValue::Write(src, dst, (*slot_desc)->type(), pool);
634  } else {
635  RawValue::Write(src, (*slot_desc)->type(), dst, &buffer);
636  }
637  }
638  }
639 
640  // Initialize aggregate output.
641  for (int i = 0; i < aggregate_evaluators_.size(); ++i, ++slot_desc) {
642  while (!(*slot_desc)->is_materialized()) ++slot_desc;
643  AggFnEvaluator* evaluator = aggregate_evaluators_[i];
644  evaluator->Init(agg_fn_ctxs[i], intermediate_tuple);
645  // Codegen specific path for min/max.
646  // To minimize branching on the UpdateTuple path, initialize the result value
647  // so that UpdateTuple doesn't have to check if the aggregation
648  // dst slot is null.
649  // TODO: remove when we don't use the irbuilder for codegen here. This optimization
650  // will no longer be necessary when all aggregates are implemented with the UDA
651  // interface.
652  if ((*slot_desc)->type().type != TYPE_STRING &&
653  (*slot_desc)->type().type != TYPE_VARCHAR &&
654  (*slot_desc)->type().type != TYPE_TIMESTAMP &&
655  (*slot_desc)->type().type != TYPE_CHAR &&
656  (*slot_desc)->type().type != TYPE_DECIMAL) {
657  ExprValue default_value;
658  void* default_value_ptr = NULL;
659  switch (evaluator->agg_op()) {
660  case AggFnEvaluator::MIN:
661  default_value_ptr = default_value.SetToMax((*slot_desc)->type());
662  RawValue::Write(default_value_ptr, intermediate_tuple, *slot_desc, NULL);
663  break;
664  case AggFnEvaluator::MAX:
665  default_value_ptr = default_value.SetToMin((*slot_desc)->type());
666  RawValue::Write(default_value_ptr, intermediate_tuple, *slot_desc, NULL);
667  break;
668  default:
669  break;
670  }
671  }
672  }
673  return intermediate_tuple;
674 }
675 
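// Applies every aggregate evaluator to 'row' against 'tuple': Merge() when the
// row carries an aggregated intermediate tuple (is_merge), Add() for a raw input row.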
676 void PartitionedAggregationNode::UpdateTuple(FunctionContext** agg_fn_ctxs,
677  Tuple* tuple, TupleRow* row, bool is_merge) {
678  DCHECK(tuple != NULL || aggregate_evaluators_.empty());
679  for (int i = 0; i < aggregate_evaluators_.size(); ++i) {
680  if (is_merge) {
681  aggregate_evaluators_[i]->Merge(agg_fn_ctxs[i], row->GetTuple(0), tuple);
682  } else {
683  aggregate_evaluators_[i]->Add(agg_fn_ctxs[i], row, tuple);
684  }
685  }
686 }
687 
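// Produces the output tuple from the intermediate 'tuple': runs Finalize() (or
// Serialize() when no finalization is needed) on the aggregate values and, if the
// output tuple differs from the intermediate tuple, copies the grouping slots across.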
688 Tuple* PartitionedAggregationNode::GetOutputTuple(
689  const vector<FunctionContext*>& agg_fn_ctxs, Tuple* tuple, MemPool* pool) {
690  DCHECK(tuple != NULL || aggregate_evaluators_.empty()) << tuple;
691  Tuple* dst = tuple;
694  }
695  if (needs_finalize_) {
696  AggFnEvaluator::Finalize(aggregate_evaluators_, agg_fn_ctxs, tuple, dst);
697  } else {
699  }
700  // Copy grouping values from tuple to dst.
701  // TODO: Codegen this.
702  if (dst != tuple) {
703  int num_grouping_slots = probe_expr_ctxs_.size();
704  for (int i = 0; i < num_grouping_slots; ++i) {
705  SlotDescriptor* src_slot_desc = intermediate_tuple_desc_->slots()[i];
706  SlotDescriptor* dst_slot_desc = output_tuple_desc_->slots()[i];
707  bool src_slot_null = tuple->IsNull(src_slot_desc->null_indicator_offset());
708  void* src_slot = NULL;
709  if (!src_slot_null) src_slot = tuple->GetSlot(src_slot_desc->tuple_offset());
710  RawValue::Write(src_slot, dst, dst_slot_desc, NULL);
711  }
712  }
713  return dst;
714 }
715 
716 void PartitionedAggregationNode::DebugString(int indentation_level,
717  stringstream* out) const {
718  *out << string(indentation_level * 2, ' ');
719  *out << "PartitionedAggregationNode("
720  << "intermediate_tuple_id=" << intermediate_tuple_id_
721  << " output_tuple_id=" << output_tuple_id_
722  << " needs_finalize=" << needs_finalize_
723  << " probe_exprs=" << Expr::DebugString(probe_expr_ctxs_)
725  ExecNode::DebugString(indentation_level, out);
726  *out << ")";
727 }
728 
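// Creates the PARTITION_FANOUT hash partitions for 'level'. Every partition's
// streams must be initialized successfully; hash table initialization may fail,
// in which case that partition is spilled immediately.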
729 Status PartitionedAggregationNode::CreateHashPartitions(int level) {
730  if (level >= MAX_PARTITION_DEPTH) {
732  status.SetErrorMsg(ErrorMsg(TErrorCode::PARTITIONED_AGG_MAX_PARTITION_DEPTH,
735  return status;
736  }
737  ht_ctx_->set_level(level);
738 
739  DCHECK(hash_partitions_.empty());
740  for (int i = 0; i < PARTITION_FANOUT; ++i) {
741  hash_partitions_.push_back(state_->obj_pool()->Add(new Partition(this, level)));
742  RETURN_IF_ERROR(hash_partitions_[i]->InitStreams());
743  }
745 
746  // Now that all the streams are reserved (meaning we have enough memory to execute
747  // the algorithm), allocate the hash tables. These can fail and we can still continue.
748  for (int i = 0; i < PARTITION_FANOUT; ++i) {
749  if (!hash_partitions_[i]->InitHashTable()) {
750  RETURN_IF_ERROR(hash_partitions_[i]->Spill());
751  }
752  }
753  COUNTER_ADD(partitions_created_, PARTITION_FANOUT);
755  return Status::OK;
756 }
757 
758 int64_t PartitionedAggregationNode::LargestSpilledPartition() const {
759  int64_t max_rows = 0;
760  for (int i = 0; i < hash_partitions_.size(); ++i) {
761  Partition* partition = hash_partitions_[i];
762  if (partition->is_spilled()) {
763  int64_t rows = partition->aggregated_row_stream->num_rows() +
764  partition->unaggregated_row_stream->num_rows();
765  if (rows > max_rows) max_rows = rows;
766  }
767  }
768  return max_rows;
769 }
770 
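// Picks the next partition to return rows from. In-memory aggregated partitions
// are output directly; otherwise a spilled partition is repartitioned at
// level + 1 (failing if repartitioning does not shrink it) until one fits in memory.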
771 Status PartitionedAggregationNode::NextPartition() {
772  DCHECK(output_partition_ == NULL);
773 
774  // Keep looping until we get to a partition that fits in memory.
775  Partition* partition = NULL;
776  while (true) {
777  partition = NULL;
778  // First return partitions that are fully aggregated (and in memory).
779  if (!aggregated_partitions_.empty()) {
780  partition = aggregated_partitions_.front();
781  DCHECK(!partition->is_spilled());
782  aggregated_partitions_.pop_front();
783  break;
784  }
785 
786  if (partition == NULL) {
787  DCHECK(!spilled_partitions_.empty());
789  needs_serialize_ ? 1 : 0);
790 
791  // TODO: we can probably do better than just picking the first partition. We
792  // can base this on the amount written to disk, etc.
793  partition = spilled_partitions_.front();
794  DCHECK(partition->is_spilled());
795 
796  // Create the new hash partitions to repartition into.
797  // TODO: we don't need to repartition here. We are now working on 1 / FANOUT
798  // of the input so it's reasonably likely it can fit. We should look at this
799  // partition's size and just do the aggregation if it fits in memory.
800  RETURN_IF_ERROR(CreateHashPartitions(partition->level + 1));
802 
803  // Rows in this partition could have been spilled into two streams, depending
804  // on whether it is an aggregated intermediate or an unaggregated row.
805  // Note: we must process the aggregated rows first to save a hash table lookup
806  // in ProcessBatch().
807  RETURN_IF_ERROR(ProcessStream<true>(partition->aggregated_row_stream.get()));
808  RETURN_IF_ERROR(ProcessStream<false>(partition->unaggregated_row_stream.get()));
809 
810  COUNTER_ADD(num_row_repartitioned_, partition->aggregated_row_stream->num_rows());
812  partition->unaggregated_row_stream->num_rows());
813 
814  partition->Close(false);
815  spilled_partitions_.pop_front();
816 
817  // Done processing this partition. Move the new partitions into
818  // spilled_partitions_/aggregated_partitions_.
819  int64_t num_input_rows = partition->aggregated_row_stream->num_rows() +
820  partition->unaggregated_row_stream->num_rows();
821 
822  // Check if there was any reduction in the size of partitions after repartitioning.
823  int64_t largest_partition = LargestSpilledPartition();
824  DCHECK_GE(num_input_rows, largest_partition) << "Cannot have a partition with "
825  "more rows than the input";
826  if (num_input_rows == largest_partition) {
828  status.AddDetail(Substitute("Cannot perform aggregation at node with id $0. "
829  "Repartitioning did not reduce the size of a spilled partition. "
830  "Repartitioning level $1. Number of rows $2.",
831  id_, partition->level + 1, num_input_rows));
833  return status;
834  }
835  RETURN_IF_ERROR(MoveHashPartitions(num_input_rows));
836  }
837  }
838 
839  DCHECK(partition->hash_tbl.get() != NULL);
840  DCHECK(partition->aggregated_row_stream->is_pinned());
841 
842  output_partition_ = partition;
843  output_iterator_ = output_partition_->hash_tbl->Begin(ht_ctx_.get());
844  COUNTER_ADD(num_hash_buckets_, output_partition_->hash_tbl->num_buckets());
845  return Status::OK;
846 }
847 
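// Reads back a spilled stream (aggregated or unaggregated rows, selected by
// AGGREGATED_ROWS) and feeds its rows through ProcessBatch(), spilling another
// partition whenever a read buffer cannot be obtained.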
848 template<bool AGGREGATED_ROWS>
849 Status PartitionedAggregationNode::ProcessStream(BufferedTupleStream* input_stream) {
850  if (input_stream->num_rows() > 0) {
851  while (true) {
852  bool got_buffer = false;
853  RETURN_IF_ERROR(input_stream->PrepareForRead(&got_buffer));
854  if (got_buffer) break;
855  // Did not have a buffer to read the input stream. Spill and try again.
857  }
858 
859  bool eos = false;
860  RowBatch batch(AGGREGATED_ROWS ? *intermediate_row_desc_ : children_[0]->row_desc(),
862  do {
863  RETURN_IF_ERROR(input_stream->GetNext(&batch, &eos));
864  RETURN_IF_ERROR(ProcessBatch<AGGREGATED_ROWS>(&batch, ht_ctx_.get()));
865  batch.Reset();
866  } while (!eos);
867  }
868  input_stream->Close();
869  return Status::OK;
870 }
871 
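// Frees memory by spilling: if the node is still using small buffers, every open
// partition is first switched to I/O-sized buffers; then the largest in-memory
// (non-spilled) partition is chosen and spilled.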
872 Status PartitionedAggregationNode::SpillPartition(Partition* curr_partition,
873  Tuple* intermediate_tuple) {
874  int64_t max_freed_mem = 0;
875  int partition_idx = -1;
876 
877  if (using_small_buffers_) {
878  for (int i = 0; i < hash_partitions_.size(); ++i) {
879  if (hash_partitions_[i]->is_closed) continue;
880  DCHECK(hash_partitions_[i]->aggregated_row_stream->using_small_buffers());
881  DCHECK(hash_partitions_[i]->unaggregated_row_stream->using_small_buffers());
882  bool got_buffer;
884  hash_partitions_[i]->aggregated_row_stream->SwitchToIoBuffers(&got_buffer));
885  if (got_buffer) {
887  hash_partitions_[i]->unaggregated_row_stream->SwitchToIoBuffers(&got_buffer));
888  }
889  if (!got_buffer) {
891  status.AddDetail("Not enough memory to get the minimum required buffers for "
892  "aggregation.");
893  return status;
894  }
895  }
896  using_small_buffers_ = false;
897  }
898 
899  // Iterate over the partitions and pick the largest partition that is not spilled.
900  for (int i = 0; i < hash_partitions_.size(); ++i) {
901  if (hash_partitions_[i]->is_closed) continue;
902  if (hash_partitions_[i]->is_spilled()) continue;
903  int64_t mem = hash_partitions_[i]->aggregated_row_stream->bytes_in_mem(true);
904  mem += hash_partitions_[i]->hash_tbl->byte_size();
905  mem += hash_partitions_[i]->agg_fn_pool->total_reserved_bytes();
906  if (mem > max_freed_mem) {
907  max_freed_mem = mem;
908  partition_idx = i;
909  }
910  }
911  if (partition_idx == -1) {
912  // Could not find a partition to spill. This means the mem limit was just too low.
914  }
915 
916  Partition* spilled_partition = hash_partitions_[partition_idx];
917  RETURN_IF_ERROR(spilled_partition->Spill(
918  spilled_partition == curr_partition ? intermediate_tuple : NULL));
919  return Status::OK;
920 }
921 
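// After the current round of partitioning, moves each hash partition into
// aggregated_partitions_ (still in memory) or spilled_partitions_ (unpinned and
// queued for repartitioning) and logs a per-partition breakdown of row counts.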
922 Status PartitionedAggregationNode::MoveHashPartitions(int64_t num_input_rows) {
923  DCHECK(!hash_partitions_.empty());
924  stringstream ss;
925  ss << "PA(node_id=" << id() << ") partitioned(level="
926  << hash_partitions_[0]->level << ") "
927  << num_input_rows << " rows into:" << endl;
928  for (int i = 0; i < hash_partitions_.size(); ++i) {
929  Partition* partition = hash_partitions_[i];
930  int64_t aggregated_rows = partition->aggregated_row_stream->num_rows();
931  int64_t unaggregated_rows = partition->unaggregated_row_stream->num_rows();
932  double total_rows = aggregated_rows + unaggregated_rows;
933  double percent = total_rows * 100 / num_input_rows;
934  ss << " " << i << " " << (partition->is_spilled() ? "spilled" : "not spilled")
935  << " (fraction=" << fixed << setprecision(2) << percent << "%)" << endl
936  << " #aggregated rows:" << aggregated_rows << endl
937  << " #unaggregated rows: " << unaggregated_rows << endl;
938 
939  // TODO: update counters to support doubles.
940  COUNTER_SET(largest_partition_percent_, static_cast<int64_t>(percent));
941 
942  if (total_rows == 0) {
943  partition->Close(false);
944  } else if (partition->is_spilled()) {
945  DCHECK(partition->hash_tbl.get() == NULL);
946  // We need to unpin all the spilled partitions to make room to allocate new
947  // hash_partitions_ when we repartition the spilled partitions.
948  // TODO: we only need to do this when we have memory pressure. This might be
949  // okay though since the block mgr should only write these to disk if there
950  // is memory pressure.
951  RETURN_IF_ERROR(partition->aggregated_row_stream->UnpinStream(true));
952  RETURN_IF_ERROR(partition->unaggregated_row_stream->UnpinStream(true));
953 
954  // Push newly created partitions to the front. This gives a depth-first walk
955  // (more finely partitioned partitions are processed first), which allows us
956  // to delete blocks earlier and bottom out the recursion earlier.
957  spilled_partitions_.push_front(partition);
958  } else {
959  aggregated_partitions_.push_back(partition);
960  }
961 
962  }
963  VLOG(2) << ss.str();
964  hash_partitions_.clear();
965  return Status::OK;
966 }
967 
968 Status PartitionedAggregationNode::QueryMaintenance(RuntimeState* state) {
969  for (int i = 0; i < aggregate_evaluators_.size(); ++i) {
971  }
973  for (int i = 0; i < hash_partitions_.size(); ++i) {
975  }
976  return ExecNode::QueryMaintenance(state);
977 }
978 
979 // IR Generation for updating a single aggregation slot. Signature is:
980 // void UpdateSlot(FunctionContext* fn_ctx, AggTuple* agg_tuple, char** row)
981 //
982 // The IR for sum(double_col) is:
983 // define void @UpdateSlot(%"class.impala_udf::FunctionContext"* %fn_ctx,
984 // { i8, double }* %agg_tuple,
985 // %"class.impala::TupleRow"* %row) #20 {
986 // entry:
987 // %src = call { i8, double } @GetSlotRef(%"class.impala::ExprContext"* inttoptr
988 // (i64 128241264 to %"class.impala::ExprContext"*), %"class.impala::TupleRow"* %row)
989 // %0 = extractvalue { i8, double } %src, 0
990 // %is_null = trunc i8 %0 to i1
991 // br i1 %is_null, label %ret, label %src_not_null
992 //
993 // src_not_null: ; preds = %entry
994 // %dst_slot_ptr = getelementptr inbounds { i8, double }* %agg_tuple, i32 0, i32 1
995 // call void @SetNotNull({ i8, double }* %agg_tuple)
996 // %dst_val = load double* %dst_slot_ptr
997 // %val = extractvalue { i8, double } %src, 1
998 // %1 = fadd double %dst_val, %val
999 // store double %1, double* %dst_slot_ptr
1000 // br label %ret
1001 //
1002 // ret: ; preds = %src_not_null, %entry
1003 // ret void
1004 // }
1005 //
1006 // The IR for ndv(double_col) is:
1007 // define void @UpdateSlot(%"class.impala_udf::FunctionContext"* %fn_ctx,
1008 // { i8, %"struct.impala::StringValue" }* %agg_tuple,
1009 // %"class.impala::TupleRow"* %row) #20 {
1010 // entry:
1011 // %dst_lowered_ptr = alloca { i64, i8* }
1012 // %src_lowered_ptr = alloca { i8, double }
1013 // %src = call { i8, double } @GetSlotRef(%"class.impala::ExprContext"* inttoptr
1014 // (i64 120530832 to %"class.impala::ExprContext"*), %"class.impala::TupleRow"* %row)
1015 // %0 = extractvalue { i8, double } %src, 0
1016 // %is_null = trunc i8 %0 to i1
1017 // br i1 %is_null, label %ret, label %src_not_null
1018 //
1019 // src_not_null: ; preds = %entry
1020 // %dst_slot_ptr = getelementptr inbounds
1021 // { i8, %"struct.impala::StringValue" }* %agg_tuple, i32 0, i32 1
1022 // call void @SetNotNull({ i8, %"struct.impala::StringValue" }* %agg_tuple)
1023 // %dst_val = load %"struct.impala::StringValue"* %dst_slot_ptr
1024 // store { i8, double } %src, { i8, double }* %src_lowered_ptr
1025 // %src_unlowered_ptr = bitcast { i8, double }* %src_lowered_ptr
1026 // to %"struct.impala_udf::DoubleVal"*
1027 // %ptr = extractvalue %"struct.impala::StringValue" %dst_val, 0
1028 // %dst_stringval = insertvalue { i64, i8* } zeroinitializer, i8* %ptr, 1
1029 // %len = extractvalue %"struct.impala::StringValue" %dst_val, 1
1030 // %1 = extractvalue { i64, i8* } %dst_stringval, 0
1031 // %2 = zext i32 %len to i64
1032 // %3 = shl i64 %2, 32
1033 // %4 = and i64 %1, 4294967295
1034 // %5 = or i64 %4, %3
1035 // %dst_stringval1 = insertvalue { i64, i8* } %dst_stringval, i64 %5, 0
1036 // store { i64, i8* } %dst_stringval1, { i64, i8* }* %dst_lowered_ptr
1037 // %dst_unlowered_ptr = bitcast { i64, i8* }* %dst_lowered_ptr
1038 // to %"struct.impala_udf::StringVal"*
1039 // call void @HllUpdate(%"class.impala_udf::FunctionContext"* %fn_ctx,
1040 // %"struct.impala_udf::DoubleVal"* %src_unlowered_ptr,
1041 // %"struct.impala_udf::StringVal"* %dst_unlowered_ptr)
1042 // %anyval_result = load { i64, i8* }* %dst_lowered_ptr
1043 // %6 = extractvalue { i64, i8* } %anyval_result, 1
1044 // %7 = insertvalue %"struct.impala::StringValue" zeroinitializer, i8* %6, 0
1045 // %8 = extractvalue { i64, i8* } %anyval_result, 0
1046 // %9 = ashr i64 %8, 32
1047 // %10 = trunc i64 %9 to i32
1048 // %11 = insertvalue %"struct.impala::StringValue" %7, i32 %10, 1
1049 // store %"struct.impala::StringValue" %11, %"struct.impala::StringValue"* %dst_slot_ptr
1050 // br label %ret
1051 //
1052 // ret: ; preds = %src_not_null, %entry
1053 // ret void
1054 // }
1055 Function* PartitionedAggregationNode::CodegenUpdateSlot(
1056  AggFnEvaluator* evaluator, SlotDescriptor* slot_desc) {
1057  DCHECK(slot_desc->is_materialized());
1058  LlvmCodeGen* codegen;
1059  if (!state_->GetCodegen(&codegen).ok()) return NULL;
1060 
1061  DCHECK_EQ(evaluator->input_expr_ctxs().size(), 1);
1062  ExprContext* input_expr_ctx = evaluator->input_expr_ctxs()[0];
1063  Expr* input_expr = input_expr_ctx->root();
1064 
1065  // TODO: implement timestamp
1066  if (input_expr->type().type == TYPE_TIMESTAMP &&
1067  evaluator->agg_op() != AggFnEvaluator::AVG) {
1068  return NULL;
1069  }
1070 
1071  Function* agg_expr_fn;
1072  Status status = input_expr->GetCodegendComputeFn(state_, &agg_expr_fn);
1073  if (!status.ok()) {
1074  VLOG_QUERY << "Could not codegen UpdateSlot(): " << status.GetDetail();
1075  return NULL;
1076  }
1077  DCHECK(agg_expr_fn != NULL);
1078 
1079  PointerType* fn_ctx_type =
1081  StructType* tuple_struct = intermediate_tuple_desc_->GenerateLlvmStruct(codegen);
1082  PointerType* tuple_ptr_type = PointerType::get(tuple_struct, 0);
1083  PointerType* tuple_row_ptr_type = codegen->GetPtrType(TupleRow::LLVM_CLASS_NAME);
1084 
1085  // Create UpdateSlot prototype
1086  LlvmCodeGen::FnPrototype prototype(codegen, "UpdateSlot", codegen->void_type());
1087  prototype.AddArgument(LlvmCodeGen::NamedVariable("fn_ctx", fn_ctx_type));
1088  prototype.AddArgument(LlvmCodeGen::NamedVariable("agg_tuple", tuple_ptr_type));
1089  prototype.AddArgument(LlvmCodeGen::NamedVariable("row", tuple_row_ptr_type));
1090 
1091  LlvmCodeGen::LlvmBuilder builder(codegen->context());
1092  Value* args[3];
1093  Function* fn = prototype.GeneratePrototype(&builder, &args[0]);
1094  Value* fn_ctx_arg = args[0];
1095  Value* agg_tuple_arg = args[1];
1096  Value* row_arg = args[2];
1097 
1098  BasicBlock* src_not_null_block =
1099  BasicBlock::Create(codegen->context(), "src_not_null", fn);
1100  BasicBlock* ret_block = BasicBlock::Create(codegen->context(), "ret", fn);
1101 
1102  // Call expr function to get src slot value
1103  Value* expr_ctx = codegen->CastPtrToLlvmPtr(
1104  codegen->GetPtrType(ExprContext::LLVM_CLASS_NAME), input_expr_ctx);
1105  Value* agg_expr_fn_args[] = { expr_ctx, row_arg };
1107  codegen, &builder, input_expr->type(), agg_expr_fn, agg_expr_fn_args, "src");
1108 
1109  Value* src_is_null = src.GetIsNull();
1110  builder.CreateCondBr(src_is_null, ret_block, src_not_null_block);
1111 
1112  // Src slot is not null, update dst_slot
1113  builder.SetInsertPoint(src_not_null_block);
1114  Value* dst_ptr =
1115  builder.CreateStructGEP(agg_tuple_arg, slot_desc->field_idx(), "dst_slot_ptr");
1116  Value* result = NULL;
1117 
1118  if (slot_desc->is_nullable()) {
1119  // Dst is NULL, just update dst slot to src slot and clear null bit
1120  Function* clear_null_fn = slot_desc->CodegenUpdateNull(codegen, tuple_struct, false);
1121  builder.CreateCall(clear_null_fn, agg_tuple_arg);
1122  }
1123 
1124  // Update the slot
1125  Value* dst_value = builder.CreateLoad(dst_ptr, "dst_val");
1126  switch (evaluator->agg_op()) {
1127  case AggFnEvaluator::COUNT:
1128  if (evaluator->is_merge()) {
1129  result = builder.CreateAdd(dst_value, src.GetVal(), "count_sum");
1130  } else {
1131  result = builder.CreateAdd(dst_value,
1132  codegen->GetIntConstant(TYPE_BIGINT, 1), "count_inc");
1133  }
1134  break;
1135  case AggFnEvaluator::MIN: {
1136  Function* min_fn = codegen->CodegenMinMax(slot_desc->type(), true);
1137  Value* min_args[] = { dst_value, src.GetVal() };
1138  result = builder.CreateCall(min_fn, min_args, "min_value");
1139  break;
1140  }
1141  case AggFnEvaluator::MAX: {
1142  Function* max_fn = codegen->CodegenMinMax(slot_desc->type(), false);
1143  Value* max_args[] = { dst_value, src.GetVal() };
1144  result = builder.CreateCall(max_fn, max_args, "max_value");
1145  break;
1146  }
1147  case AggFnEvaluator::SUM:
1148  if (slot_desc->type().type != TYPE_DECIMAL) {
1149  if (slot_desc->type().type == TYPE_FLOAT ||
1150  slot_desc->type().type == TYPE_DOUBLE) {
1151  result = builder.CreateFAdd(dst_value, src.GetVal());
1152  } else {
1153  result = builder.CreateAdd(dst_value, src.GetVal());
1154  }
1155  break;
1156  }
1157  DCHECK_EQ(slot_desc->type().type, TYPE_DECIMAL);
1158  // Fall through to xcompiled case
1159  case AggFnEvaluator::AVG:
1160  case AggFnEvaluator::NDV: {
1161  // Get xcompiled update/merge function from IR module
1162  const string& symbol = evaluator->is_merge() ?
1163  evaluator->merge_symbol() : evaluator->update_symbol();
1164  Function* ir_fn = codegen->module()->getFunction(symbol);
1165  DCHECK_NOTNULL(ir_fn);
1166 
1167  // Create pointer to src to pass to ir_fn. We must use the unlowered type.
1168  Value* src_lowered_ptr = codegen->CreateEntryBlockAlloca(
1169  fn, LlvmCodeGen::NamedVariable("src_lowered_ptr", src.value()->getType()));
1170  builder.CreateStore(src.value(), src_lowered_ptr);
1171  Type* unlowered_ptr_type =
1172  CodegenAnyVal::GetUnloweredPtrType(codegen, input_expr->type());
1173  Value* src_unlowered_ptr =
1174  builder.CreateBitCast(src_lowered_ptr, unlowered_ptr_type, "src_unlowered_ptr");
1175 
1176  // Create intermediate argument 'dst' from 'dst_value'
1177  const ColumnType& dst_type = evaluator->intermediate_type();
1179  codegen, &builder, dst_type, "dst");
1180  dst.SetFromRawValue(dst_value);
1181  // Create pointer to dst to pass to ir_fn. We must use the unlowered type.
1182  Value* dst_lowered_ptr = codegen->CreateEntryBlockAlloca(
1183  fn, LlvmCodeGen::NamedVariable("dst_lowered_ptr", dst.value()->getType()));
1184  builder.CreateStore(dst.value(), dst_lowered_ptr);
1185  unlowered_ptr_type = CodegenAnyVal::GetUnloweredPtrType(codegen, dst_type);
1186  Value* dst_unlowered_ptr =
1187  builder.CreateBitCast(dst_lowered_ptr, unlowered_ptr_type, "dst_unlowered_ptr");
1188 
1189  // Call 'ir_fn'
1190  builder.CreateCall3(ir_fn, fn_ctx_arg, src_unlowered_ptr, dst_unlowered_ptr);
1191 
1192  // Convert StringVal intermediate 'dst_arg' back to StringValue
1193  Value* anyval_result = builder.CreateLoad(dst_lowered_ptr, "anyval_result");
1194  result = CodegenAnyVal(codegen, &builder, dst_type, anyval_result).ToNativeValue();
1195  break;
1196  }
1197  default:
1198  DCHECK(false) << "bad aggregate operator: " << evaluator->agg_op();
1199  }
1200 
1201  builder.CreateStore(result, dst_ptr);
1202  builder.CreateBr(ret_block);
1203 
1204  builder.SetInsertPoint(ret_block);
1205  builder.CreateRetVoid();
1206 
1207  return codegen->FinalizeFunction(fn);
1208 }
1209 
1210 // IR codegen for the UpdateTuple loop. This loop is query specific and based on the
1211 // aggregate functions. The function signature must match the non-codegen'd UpdateTuple
1212 // exactly.
1213 // For the query:
1214 // select count(*), count(int_col), sum(double_col) the IR looks like:
1215 //
1216 
1217 // ; Function Attrs: alwaysinline
1218 // define void @UpdateTuple(%"class.impala::PartitionedAggregationNode"* %this_ptr,
1219 // %"class.impala_udf::FunctionContext"** %agg_fn_ctxs,
1220 // %"class.impala::Tuple"* %tuple,
1221 // %"class.impala::TupleRow"* %row,
1222 // i1 %is_merge) #20 {
1223 // entry:
1224 // %tuple1 = bitcast %"class.impala::Tuple"* %tuple to { i8, i64, i64, double }*
1225 // %src_slot = getelementptr inbounds { i8, i64, i64, double }* %tuple1, i32 0, i32 1
1226 // %count_star_val = load i64* %src_slot
1227 // %count_star_inc = add i64 %count_star_val, 1
1228 // store i64 %count_star_inc, i64* %src_slot
1229 // %0 = getelementptr %"class.impala_udf::FunctionContext"** %agg_fn_ctxs, i32 1
1230 // %fn_ctx = load %"class.impala_udf::FunctionContext"** %0
1231 // call void @UpdateSlot(%"class.impala_udf::FunctionContext"* %fn_ctx,
1232 // { i8, i64, i64, double }* %tuple1,
1233 // %"class.impala::TupleRow"* %row)
1234 // %1 = getelementptr %"class.impala_udf::FunctionContext"** %agg_fn_ctxs, i32 2
1235 // %fn_ctx2 = load %"class.impala_udf::FunctionContext"** %1
1236 // call void @UpdateSlot5(%"class.impala_udf::FunctionContext"* %fn_ctx2,
1237 // { i8, i64, i64, double }* %tuple1,
1238 // %"class.impala::TupleRow"* %row)
1239 // ret void
1240 // }
1241 Function* PartitionedAggregationNode::CodegenUpdateTuple() {
1242  LlvmCodeGen* codegen;
1243  if (!state_->GetCodegen(&codegen).ok()) return NULL;
1244  SCOPED_TIMER(codegen->codegen_timer());
1245 
1246  int j = probe_expr_ctxs_.size();
1247  for (int i = 0; i < aggregate_evaluators_.size(); ++i, ++j) {
1248  // skip non-materialized slots; we don't have evaluators instantiated for those
1249  while (!intermediate_tuple_desc_->slots()[j]->is_materialized()) {
1250  DCHECK_LT(j, intermediate_tuple_desc_->slots().size() - 1);
1251  ++j;
1252  }
1253  SlotDescriptor* slot_desc = intermediate_tuple_desc_->slots()[j];
1254  AggFnEvaluator* evaluator = aggregate_evaluators_[i];
1255 
1256  // Don't codegen things that aren't builtins (for now)
1257  if (!evaluator->is_builtin()) return NULL;
1258 
1259  bool supported = true;
1260  AggFnEvaluator::AggregationOp op = evaluator->agg_op();
1261  PrimitiveType type = slot_desc->type().type;
1262  // Char and timestamp intermediates aren't supported
1263  if (type == TYPE_TIMESTAMP || type == TYPE_CHAR) supported = false;
1264  // Only AVG and NDV support string intermediates
1265  if ((type == TYPE_STRING || type == TYPE_VARCHAR) &&
1266  !(op == AggFnEvaluator::AVG || op == AggFnEvaluator::NDV)) {
1267  supported = false;
1268  }
1269  // Only SUM, AVG, and NDV support decimal intermediates
1270  if (type == TYPE_DECIMAL &&
1271  !(op == AggFnEvaluator::SUM || op == AggFnEvaluator::AVG ||
1272  op == AggFnEvaluator::NDV)) {
1273  supported = false;
1274  }
1275  if (!supported) {
1276  VLOG_QUERY << "Could not codegen UpdateTuple because intermediate type "
1277  << slot_desc->type()
1278  << " is not yet supported for aggregate function \""
1279  << evaluator->fn_name() << "()\"";
1280  return NULL;
1281  }
1282  }
1283 
1284  if (intermediate_tuple_desc_->GenerateLlvmStruct(codegen) == NULL) {
1285  VLOG_QUERY << "Could not codegen UpdateTuple because we could not generate"
1286  << " a matching llvm struct for the intermediate tuple.";
1287  return NULL;
1288  }
1289 
1290  // Get the types to match the UpdateTuple signature
1291  Type* agg_node_type = codegen->GetType(PartitionedAggregationNode::LLVM_CLASS_NAME);
1292  Type* fn_ctx_type = codegen->GetType(FunctionContextImpl::LLVM_FUNCTIONCONTEXT_NAME);
1293  Type* tuple_type = codegen->GetType(Tuple::LLVM_CLASS_NAME);
1294  Type* tuple_row_type = codegen->GetType(TupleRow::LLVM_CLASS_NAME);
1295 
1296  PointerType* agg_node_ptr_type = agg_node_type->getPointerTo();
1297  PointerType* fn_ctx_ptr_ptr_type = fn_ctx_type->getPointerTo()->getPointerTo();
1298  PointerType* tuple_ptr_type = tuple_type->getPointerTo();
1299  PointerType* tuple_row_ptr_type = tuple_row_type->getPointerTo();
1300 
1301  StructType* tuple_struct = intermediate_tuple_desc_->GenerateLlvmStruct(codegen);
1302  PointerType* tuple_ptr = PointerType::get(tuple_struct, 0);
1303  LlvmCodeGen::FnPrototype prototype(codegen, "UpdateTuple", codegen->void_type());
1304  prototype.AddArgument(LlvmCodeGen::NamedVariable("this_ptr", agg_node_ptr_type));
1305  prototype.AddArgument(LlvmCodeGen::NamedVariable("agg_fn_ctxs", fn_ctx_ptr_ptr_type));
1306  prototype.AddArgument(LlvmCodeGen::NamedVariable("tuple", tuple_ptr_type));
1307  prototype.AddArgument(LlvmCodeGen::NamedVariable("row", tuple_row_ptr_type));
1308  prototype.AddArgument(LlvmCodeGen::NamedVariable("is_merge", codegen->boolean_type()));
1309 
1310  LlvmCodeGen::LlvmBuilder builder(codegen->context());
1311  Value* args[5];
1312  Function* fn = prototype.GeneratePrototype(&builder, &args[0]);
1313 
1314  Value* agg_fn_ctxs_arg = args[1];
1315  Value* tuple_arg = args[2];
1316  Value* row_arg = args[3];
1317 
1318  // Cast the parameter types to the internal llvm runtime types.
1319  // TODO: get rid of this by using the right type in the function signature
1320  tuple_arg = builder.CreateBitCast(tuple_arg, tuple_ptr, "tuple");
1321 
1322  // Loop over each expr and generate the IR for that slot. If the expr is not
1323  // count(*), generate a helper IR function to update the slot and call that.
1324  j = probe_expr_ctxs_.size();
1325  for (int i = 0; i < aggregate_evaluators_.size(); ++i, ++j) {
1326  // skip non-materialized slots; we don't have evaluators instantiated for those
1327  while (!intermediate_tuple_desc_->slots()[j]->is_materialized()) {
1328  DCHECK_LT(j, intermediate_tuple_desc_->slots().size() - 1);
1329  ++j;
1330  }
1331  SlotDescriptor* slot_desc = intermediate_tuple_desc_->slots()[j];
1332  AggFnEvaluator* evaluator = aggregate_evaluators_[i];
1333  if (evaluator->is_count_star()) {
1334  // TODO: we should be able to hoist this up to the loop over the batch and just
1335  // increment the slot by the number of rows in the batch.
1336  int field_idx = slot_desc->field_idx();
1337  Value* const_one = codegen->GetIntConstant(TYPE_BIGINT, 1);
1338  Value* slot_ptr = builder.CreateStructGEP(tuple_arg, field_idx, "src_slot");
1339  Value* slot_loaded = builder.CreateLoad(slot_ptr, "count_star_val");
1340  Value* count_inc = builder.CreateAdd(slot_loaded, const_one, "count_star_inc");
1341  builder.CreateStore(count_inc, slot_ptr);
1342  } else {
1343  Function* update_slot_fn = CodegenUpdateSlot(evaluator, slot_desc);
1344  if (update_slot_fn == NULL) return NULL;
1345  Value* fn_ctx_ptr = builder.CreateConstGEP1_32(agg_fn_ctxs_arg, i);
1346  Value* fn_ctx = builder.CreateLoad(fn_ctx_ptr, "fn_ctx");
1347  builder.CreateCall3(update_slot_fn, fn_ctx, tuple_arg, row_arg);
1348  }
1349  }
1350  builder.CreateRetVoid();
1351 
1352  // CodegenProcessBatch() does the final optimizations.
1353  return codegen->FinalizeFunction(fn);
1354 }
1355 
1356 Function* PartitionedAggregationNode::CodegenProcessBatch() {
1357  LlvmCodeGen* codegen;
1358  if (!state_->GetCodegen(&codegen).ok()) return NULL;
1359  SCOPED_TIMER(codegen->codegen_timer());
1360 
1361  Function* update_tuple_fn = CodegenUpdateTuple();
1362  if (update_tuple_fn == NULL) return NULL;
1363 
1364  // Get the cross compiled update row batch function
1365  IRFunction::Type ir_fn = (!probe_expr_ctxs_.empty() ?
1366  IRFunction::PART_AGG_NODE_PROCESS_BATCH_FALSE :
1367  IRFunction::PART_AGG_NODE_PROCESS_BATCH_NO_GROUPING);
1368  Function* process_batch_fn = codegen->GetFunction(ir_fn);
1369  DCHECK(process_batch_fn != NULL);
1370 
1371  int replaced = 0;
1372  if (!probe_expr_ctxs_.empty()) {
1373  // Aggregation w/o grouping does not use a hash table.
1374 
1375  // Codegen for hash
1376  // The codegen'd ProcessBatch function is only used in Open() with level_ = 0,
1377  // so don't use murmur hash
1378  Function* hash_fn = ht_ctx_->CodegenHashCurrentRow(state_, /* use murmur */ false);
1379  if (hash_fn == NULL) return NULL;
1380 
1381  // Codegen HashTable::Equals
1382  Function* equals_fn = ht_ctx_->CodegenEquals(state_);
1383  if (equals_fn == NULL) return NULL;
1384 
1385  // Codegen for evaluating probe rows
1386  Function* eval_probe_row_fn = ht_ctx_->CodegenEvalRow(state_, false);
1387  if (eval_probe_row_fn == NULL) return NULL;
1388 
1389  // Replace call sites
1390  process_batch_fn = codegen->ReplaceCallSites(process_batch_fn, false,
1391  eval_probe_row_fn, "EvalProbeRow", &replaced);
1392  DCHECK_EQ(replaced, 1);
1393 
1394  process_batch_fn = codegen->ReplaceCallSites(process_batch_fn, true,
1395  hash_fn, "HashCurrentRow", &replaced);
1396  DCHECK_EQ(replaced, 1);
1397 
1398  process_batch_fn = codegen->ReplaceCallSites(process_batch_fn, true,
1399  equals_fn, "Equals", &replaced);
1400  DCHECK_EQ(replaced, 3);
1401  }
1402 
1403  process_batch_fn = codegen->ReplaceCallSites(process_batch_fn, false,
1404  update_tuple_fn, "UpdateTuple", &replaced);
1405  DCHECK_GE(replaced, 1);
1406  DCHECK(process_batch_fn != NULL);
1407  return codegen->OptimizeFunctionWithExprs(process_batch_fn);
1408 }
1409 
1410 }
For C++/IR interop, we need to be able to look up types by name.
Definition: tuple.h:134
void Serialize(FunctionContext *agg_fn_ctx, Tuple *dst)
const ColumnType & type() const
Definition: descriptors.h:78
ObjectPool * obj_pool() const
Definition: runtime-state.h:92
TupleId intermediate_tuple_id_
Tuple into which Update()/Merge()/Serialize() results are stored.
static const char * LLVM_FUNCTIONCONTEXT_NAME
Definition: udf-internal.h:93
PrimitiveType
Definition: types.h:27
#define RETURN_IF_CANCELLED(state)
ObjectPool pool
void Init(FunctionContext *agg_fn_ctx, Tuple *dst)
Functions for different phases of the aggregation.
virtual Status Prepare(RuntimeState *state)
Definition: exec-node.cc:130
#define ADD_COUNTER(profile, name, unit)
uint32_t fragment_hash_seed() const
llvm::Function * GetFunction(IRFunction::Type)
void IR_ALWAYS_INLINE Next()
Iterates to the next element. It should be called only if !AtEnd().
void MarkNeedToReturn()
Definition: row-batch.h:167
void AddFunctionToJit(llvm::Function *fn, void **fn_ptr)
llvm::Function * CodegenUpdateNull(LlvmCodeGen *, llvm::StructType *tuple, bool set_null)
Definition: descriptors.cc:510
static void Write(const void *value, Tuple *tuple, const SlotDescriptor *slot_desc, MemPool *pool)
Definition: raw-value.cc:303
void AddExprCtxsToFree(const std::vector< ExprContext * > &ctxs)
virtual Status QueryMaintenance(RuntimeState *state)
Definition: exec-node.cc:401
This is the superclass of all expr evaluation nodes.
Definition: expr.h:116
virtual void Close(RuntimeState *state)
RuntimeProfile::HighWaterMarkCounter * max_partition_level_
Level of max partition (i.e. number of repartitioning steps).
#define VLOG_ROW
Definition: logging.h:59
const std::string & fn_name() const
const DescriptorTbl & desc_tbl() const
Definition: runtime-state.h:93
bool is_closed()
Definition: exec-node.h:242
void CommitLastRow()
Definition: row-batch.h:109
bool using_small_buffers_
If true, the partitions in hash_partitions_ are using small buffers.
virtual Status Reset(RuntimeState *state)
std::vector< ExecNode * > children_
Definition: exec-node.h:214
std::vector< Partition * > hash_partitions_
Current partitions we are partitioning into.
RuntimeProfile::Counter * build_timer_
Time spent processing the child rows.
int64_t rows_returned() const
Definition: exec-node.h:157
#define COUNTER_SET(c, v)
uint64_t count
int batch_size() const
Definition: runtime-state.h:98
llvm::Function * CodegenUpdateTuple()
Codegen UpdateTuple(). Returns NULL if codegen is unsuccessful.
MemPool * tuple_data_pool()
Definition: row-batch.h:148
RuntimeProfile::Counter * rows_returned_counter_
Definition: exec-node.h:226
static const Status MEM_LIMIT_EXCEEDED
Definition: status.h:89
ExecNode * child(int i)
Definition: exec-node.h:241
Status SetMemLimitExceeded(MemTracker *tracker=NULL, int64_t failed_allocation_size=0)
RuntimeProfile::Counter * num_repartitions_
Number of partitions that have been repartitioned.
const std::string & update_symbol() const
void SetTuple(int tuple_idx, Tuple *tuple)
Definition: tuple-row.h:34
const ColumnType & type() const
Definition: expr.h:145
llvm::Value * value()
Returns the current type-lowered value.
void SetErrorMsg(const ErrorMsg &m)
Definition: status.h:197
static int64_t NextPowerOfTwo(int64_t v)
Definition: bit-util.h:50
#define UNLIKELY(expr)
Definition: compiler-util.h:33
bool codegen_enabled() const
Returns true if codegen is enabled for this query.
bool AddRow(TupleRow *row, uint8_t **dst=NULL)
HighWaterMarkCounter * AddHighWaterMarkCounter(const std::string &name, TUnit::type unit, const std::string &parent_counter_name="")
Reference to a single slot of a tuple.
Definition: slot-ref.h:23
std::vector< impala_udf::FunctionContext * > agg_fn_ctxs
Clone of parent's agg_fn_ctxs_ and backing MemPool.
ProcessRowBatchFn process_row_batch_fn_
Jitted ProcessRowBatch function pointer. Null if codegen is disabled.
llvm::Value * GetVal(const char *name="val")
Status PrepareForRead(bool *got_buffer=NULL)
static const Status OK
Definition: status.h:87
ObjectPool * pool_
Definition: exec-node.h:211
boost::scoped_ptr< BufferedTupleStream > aggregated_row_stream
virtual Status GetCodegendComputeFn(RuntimeState *state, llvm::Function **fn)=0
llvm::Type * GetType(const ColumnType &type)
Returns llvm type for the column type.
Status GetCodegen(LlvmCodeGen **codegen, bool initialize=true)
int64_t num_rows() const
Number of rows in the stream.
RuntimeProfile::Counter * get_results_timer_
Time spent returning the aggregated rows.
int tuple_offset() const
Definition: descriptors.h:88
int field_idx() const
Returns the field index in the generated llvm struct for this slot's tuple.
Definition: descriptors.h:87
llvm::Value * GetIsNull(const char *name="is_null")
Gets the 'is_null' field of the *Val.
llvm::Value * GetIntConstant(PrimitiveType type, int64_t val)
Returns the constant 'val' of 'type'.
virtual Status QueryMaintenance(RuntimeState *state)
Frees local allocations from aggregate_evaluators_ and agg_fn_ctxs.
static Status CreateExprTrees(ObjectPool *pool, const std::vector< TExpr > &texprs, std::vector< ExprContext * > *ctxs)
Definition: expr.cc:149
llvm::Function * FinalizeFunction(llvm::Function *function)
Status ProcessBatchNoGrouping(RowBatch *batch, HashTableCtx *ht_ctx=NULL)
static bool EvalConjuncts(ExprContext *const *ctxs, int num_ctxs, TupleRow *row)
Definition: exec-node.cc:393
bool is_materialized() const
Definition: descriptors.h:92
virtual Status Prepare(RuntimeState *state)
static Status Prepare(const std::vector< ExprContext * > &ctxs, RuntimeState *state, const RowDescriptor &row_desc, MemTracker *tracker)
#define VLOG_ROW_IS_ON
Definition: logging.h:66
std::vector< AggFnEvaluator * > aggregate_evaluators_
virtual Status Open(RuntimeState *state)
Definition: exec-node.cc:154
std::vector< ExprContext * > probe_expr_ctxs_
Exprs used to evaluate input rows.
llvm::Function * ReplaceCallSites(llvm::Function *caller, bool update_in_place, llvm::Function *new_fn, const std::string &target_name, int *num_replaced)
string PrintRow(TupleRow *row, const RowDescriptor &d)
Definition: debug-util.cc:192
bool ok() const
Definition: status.h:172
llvm::Type * void_type()
Definition: llvm-codegen.h:394
Status ProcessStream(BufferedTupleStream *input_stream)
Reads all the rows from input_stream and process them by calling ProcessBatch().
std::vector< ExprContext * > conjunct_ctxs_
Definition: exec-node.h:212
virtual void Close(RuntimeState *state)
Definition: exec-node.cc:166
llvm::LLVMContext & context()
Definition: llvm-codegen.h:214
Status GetNext(RowBatch *batch, bool *eos, std::vector< RowIdx > *indices=NULL)
virtual std::string DebugString() const
Definition: expr.cc:385
llvm::Function * OptimizeFunctionWithExprs(llvm::Function *fn)
void UpdateTuple(impala_udf::FunctionContext **agg_fn_ctxs, Tuple *tuple, TupleRow *row, bool is_merge=false)
virtual Status Open(RuntimeState *state)
virtual Status GetNext(RuntimeState *state, RowBatch *row_batch, bool *eos)
boost::scoped_ptr< HashTableCtx > ht_ctx_
llvm::Function * CodegenUpdateSlot(AggFnEvaluator *evaluator, SlotDescriptor *slot_desc)
RuntimeProfile::Counter * ht_resize_timer_
Total time spent resizing hash tables.
PartitionedAggregationNode(ObjectPool *pool, const TPlanNode &tnode, const DescriptorTbl &descs)
RuntimeProfile * runtime_profile()
Definition: exec-node.h:161
void Finalize(FunctionContext *agg_fn_ctx, Tuple *src, Tuple *dst)
const std::vector< ExprContext * > & input_expr_ctxs() const