doc/html/aggregation-node_8cc_source.html

 // Copyright 2012 Cloudera Inc.

 //

 // Licensed under the Apache License, Version 2.0 (the "License");

 // you may not use this file except in compliance with the License.

 // You may obtain a copy of the License at

 //

 // http://www.apache.org/licenses/LICENSE-2.0

 //

 // Unless required by applicable law or agreed to in writing, software

 // distributed under the License is distributed on an "AS IS" BASIS,

 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 // See the License for the specific language governing permissions and

 // limitations under the License.


 #include "exec/aggregation-node.h"


 #include <math.h>

 #include <sstream>

 #include <boost/functional/hash.hpp>

 #include <thrift/protocol/TDebugProtocol.h>


 #include <x86intrin.h>


 #include "codegen/codegen-anyval.h"

 #include "codegen/llvm-codegen.h"

 #include "exec/old-hash-table.inline.h"

 #include "exprs/agg-fn-evaluator.h"

 #include "exprs/expr.h"

 #include "exprs/expr-context.h"

 #include "exprs/slot-ref.h"

 #include "runtime/descriptors.h"

 #include "runtime/mem-pool.h"

 #include "runtime/raw-value.h"

 #include "runtime/row-batch.h"

 #include "runtime/runtime-state.h"

 #include "runtime/string-value.inline.h"

 #include "runtime/tuple.h"

 #include "runtime/tuple-row.h"

 #include "udf/udf-internal.h"

 #include "util/debug-util.h"

 #include "util/runtime-profile.h"


 #include "gen-cpp/Exprs_types.h"

 #include "gen-cpp/PlanNodes_types.h"


 #include "common/names.h"


 using namespace impala;

 using namespace llvm;


 namespace impala {


 // Type name passed to LlvmCodeGen::GetType() by the codegen code in this file to look
 // up the IR type that corresponds to AggregationNode.
 const char* AggregationNode::LLVM_CLASS_NAME = "class.impala::AggregationNode";


 // TODO: pass in maximum size; enforce by setting limit in mempool

 // Builds the node from its thrift plan description. Only the intermediate/output tuple
 // ids and the finalize flag are read from 'tnode' here; descriptors, function pointers,
 // timers and counters all start out NULL and are filled in by Prepare().
 AggregationNode::AggregationNode(ObjectPool* pool, const TPlanNode& tnode,
                                  const DescriptorTbl& descs)
   : ExecNode(pool, tnode, descs),
     intermediate_tuple_id_(tnode.agg_node.intermediate_tuple_id),
     intermediate_tuple_desc_(NULL),
     output_tuple_id_(tnode.agg_node.output_tuple_id),
     output_tuple_desc_(NULL),
     singleton_intermediate_tuple_(NULL),
     codegen_process_row_batch_fn_(NULL),
     process_row_batch_fn_(NULL),
     needs_finalize_(tnode.agg_node.need_finalize),
     build_timer_(NULL),
     get_results_timer_(NULL),
     hash_table_buckets_counter_(NULL),
     // Assigned in Prepare() like the counters above; start it at NULL too so it never
     // holds an indeterminate pointer.
     hash_table_load_factor_counter_(NULL) {
 }


 // Creates the expression state described by 'tnode': the grouping exprs become
 // probe_expr_ctxs_, and one AggFnEvaluator is created per aggregate function and
 // appended to aggregate_evaluators_ in plan order. Returns the first error hit.
 Status AggregationNode::Init(const TPlanNode& tnode) {
   RETURN_IF_ERROR(ExecNode::Init(tnode));
   RETURN_IF_ERROR(
       Expr::CreateExprTrees(pool_, tnode.agg_node.grouping_exprs, &probe_expr_ctxs_));

   int fn_idx = 0;
   while (fn_idx < tnode.agg_node.aggregate_functions.size()) {
     AggFnEvaluator* new_evaluator;
     RETURN_IF_ERROR(AggFnEvaluator::Create(
         pool_, tnode.agg_node.aggregate_functions[fn_idx], &new_evaluator));
     aggregate_evaluators_.push_back(new_evaluator);
     ++fn_idx;
   }
   return Status::OK;
 }


 // Prepares the node for execution. In order, this:
 //  - creates the tuple and aggregate-function memory pools and the profile counters,
 //  - looks up the intermediate and output tuple descriptors,
 //  - prepares the probe (grouping) exprs against the child's row and builds matching
 //    SlotRef build exprs over the intermediate tuple,
 //  - prepares each aggregate evaluator against its intermediate/output slot pair,
 //  - creates the hash table (and, when there is no grouping, the single intermediate
 //    tuple), and
 //  - if codegen is enabled, tries to replace the interpreted row-batch processing
 //    with a codegen'd function.
 // Returns the first error encountered; a codegen failure is not an error.
 Status AggregationNode::Prepare(RuntimeState* state) {
   SCOPED_TIMER(runtime_profile_->total_time_counter());
   RETURN_IF_ERROR(ExecNode::Prepare(state));

   tuple_pool_.reset(new MemPool(mem_tracker()));
   agg_fn_pool_.reset(new MemPool(expr_mem_tracker()));
   build_timer_ = ADD_TIMER(runtime_profile(), "BuildTime");
   get_results_timer_ = ADD_TIMER(runtime_profile(), "GetResultsTime");
   hash_table_buckets_counter_ =
       ADD_COUNTER(runtime_profile(), "BuildBuckets", TUnit::UNIT);
   hash_table_load_factor_counter_ =
       ADD_COUNTER(runtime_profile(), "LoadFactor", TUnit::DOUBLE_VALUE);

   intermediate_tuple_desc_ =
       state->desc_tbl().GetTupleDescriptor(intermediate_tuple_id_);
   output_tuple_desc_ = state->desc_tbl().GetTupleDescriptor(output_tuple_id_);
   // The code below indexes both descriptors with the same slot index, so they must
   // have the same number of slots.
   DCHECK_EQ(intermediate_tuple_desc_->slots().size(),
       output_tuple_desc_->slots().size());
   RETURN_IF_ERROR(
       Expr::Prepare(probe_expr_ctxs_, state, child(0)->row_desc(), expr_mem_tracker()));

   // Construct build exprs from intermediate_tuple_desc_: the i-th grouping expr
   // corresponds to the i-th slot of the intermediate tuple.
   for (int i = 0; i < probe_expr_ctxs_.size(); ++i) {
     SlotDescriptor* desc = intermediate_tuple_desc_->slots()[i];
     DCHECK(desc->type().type == TYPE_NULL ||
            desc->type() == probe_expr_ctxs_[i]->root()->type());
     // TODO: Generate the build exprs in the FE such that the existing logic
     // for handling NULL_TYPE works.
     // Hack to avoid TYPE_NULL SlotRefs.
     Expr* expr = desc->type().type != TYPE_NULL ?
         new SlotRef(desc) : new SlotRef(desc, TYPE_BOOLEAN);
     // Both the expr and its context are handed to the state's object pool.
     state->obj_pool()->Add(expr);
     build_expr_ctxs_.push_back(new ExprContext(expr));
     state->obj_pool()->Add(build_expr_ctxs_.back());
   }
   // Construct a new row desc for preparing the build exprs because neither the child's
   // nor this node's output row desc may contain the intermediate tuple, e.g.,
   // in a single-node plan with an intermediate tuple different from the output tuple.
   RowDescriptor build_row_desc(intermediate_tuple_desc_, false);
   RETURN_IF_ERROR(
       Expr::Prepare(build_expr_ctxs_, state, build_row_desc, expr_mem_tracker()));

   // Aggregate slots follow the grouping slots; 'j' walks the slots while 'i' walks the
   // evaluators.
   agg_fn_ctxs_.resize(aggregate_evaluators_.size());
   int j = probe_expr_ctxs_.size();
   for (int i = 0; i < aggregate_evaluators_.size(); ++i, ++j) {
     // skip non-materialized slots; we don't have evaluators instantiated for those
     while (!intermediate_tuple_desc_->slots()[j]->is_materialized()) {
       DCHECK_LT(j, intermediate_tuple_desc_->slots().size() - 1)
           << "#eval= " << aggregate_evaluators_.size()
           << " #probe=" << probe_expr_ctxs_.size();
       ++j;
     }
     SlotDescriptor* intermediate_slot_desc = intermediate_tuple_desc_->slots()[j];
     SlotDescriptor* output_slot_desc = output_tuple_desc_->slots()[j];
     // Evaluator Prepare() fills in agg_fn_ctxs_[i]; the context is then added to the
     // state's object pool.
     RETURN_IF_ERROR(aggregate_evaluators_[i]->Prepare(state, child(0)->row_desc(),
         intermediate_slot_desc, output_slot_desc, agg_fn_pool_.get(), &agg_fn_ctxs_[i]));
     state->obj_pool()->Add(agg_fn_ctxs_[i]);
   }

   // TODO: how many buckets?
   // NOTE(review): the literal arguments (1, true, true, ..., true) are positional
   // OldHashTable constructor options whose meaning is not visible in this file —
   // confirm against the OldHashTable declaration.
   hash_tbl_.reset(new OldHashTable(state, build_expr_ctxs_, probe_expr_ctxs_, 1,
                                    true, true, id(), mem_tracker(), true));

   if (probe_expr_ctxs_.empty()) {
     // create single intermediate tuple now; we need to output something
     // even if our input is empty
     singleton_intermediate_tuple_ = ConstructIntermediateTuple();
     hash_tbl_->Insert(singleton_intermediate_tuple_);
     output_iterator_ = hash_tbl_->Begin();
   }

   if (state->codegen_enabled()) {
     LlvmCodeGen* codegen;
     RETURN_IF_ERROR(state->GetCodegen(&codegen));
     // Either codegen step may return NULL, in which case process_row_batch_fn_ stays
     // NULL and Open() uses the interpreted ProcessRowBatch*() functions.
     Function* update_tuple_fn = CodegenUpdateTuple(state);
     if (update_tuple_fn != NULL) {
       codegen_process_row_batch_fn_ =
           CodegenProcessRowBatch(state, update_tuple_fn);
       if (codegen_process_row_batch_fn_ != NULL) {
         // Update to using codegen'd process row batch.
         codegen->AddFunctionToJit(codegen_process_row_batch_fn_,
             reinterpret_cast<void**>(&process_row_batch_fn_));
         AddRuntimeExecOption("Codegen Enabled");
       }
     }
   }
   return Status::OK;
 }


 // Opens the exprs, the aggregate evaluators and the child, then drains the child
 // completely, folding every input batch into the hash table. When this returns OK the
 // child has been closed and output_iterator_ points at the first aggregated row.
 Status AggregationNode::Open(RuntimeState* state) {
   SCOPED_TIMER(runtime_profile_->total_time_counter());
   RETURN_IF_ERROR(ExecNode::Open(state));

   RETURN_IF_ERROR(Expr::Open(probe_expr_ctxs_, state));
   RETURN_IF_ERROR(Expr::Open(build_expr_ctxs_, state));

   DCHECK_EQ(aggregate_evaluators_.size(), agg_fn_ctxs_.size());
   for (int eval_idx = 0; eval_idx < aggregate_evaluators_.size(); ++eval_idx) {
     RETURN_IF_ERROR(
         aggregate_evaluators_[eval_idx]->Open(state, agg_fn_ctxs_[eval_idx]));
   }

   RETURN_IF_ERROR(children_[0]->Open(state));

   RowBatch batch(children_[0]->row_desc(), state->batch_size(), mem_tracker());
   int64_t num_input_rows = 0;
   bool eos = false;
   do {
     RETURN_IF_CANCELLED(state);
     RETURN_IF_ERROR(QueryMaintenance(state));
     RETURN_IF_ERROR(children_[0]->GetNext(state, &batch, &eos));
     // Everything from here to the end of the iteration counts as build time.
     SCOPED_TIMER(build_timer_);

     if (VLOG_ROW_IS_ON) {
       for (int row_idx = 0; row_idx < batch.num_rows(); ++row_idx) {
         TupleRow* input_row = batch.GetRow(row_idx);
         VLOG_ROW << "input row: " << PrintRow(input_row, children_[0]->row_desc());
       }
     }

     // Prefer the codegen'd function when Prepare() installed one; otherwise pick the
     // interpreted variant based on whether there are grouping exprs.
     if (process_row_batch_fn_ == NULL) {
       if (probe_expr_ctxs_.empty()) {
         ProcessRowBatchNoGrouping(&batch);
       } else {
         ProcessRowBatchWithGrouping(&batch);
       }
     } else {
       process_row_batch_fn_(this, &batch);
     }

     COUNTER_SET(hash_table_buckets_counter_, hash_tbl_->num_buckets());
     COUNTER_SET(hash_table_load_factor_counter_, hash_tbl_->load_factor());
     num_input_rows += batch.num_rows();
     // output_iterator_ is refreshed on every iteration rather than once after the
     // loop, because it must be valid even if the function returns from inside the loop.
     output_iterator_ = hash_tbl_->Begin();

     batch.Reset();
     RETURN_IF_ERROR(QueryMaintenance(state));
   } while (!eos);

   // We have consumed all of the input from the child and transferred ownership of the
   // resources we need, so the child can be closed safely to release its resources.
   child(0)->Close(state);
   VLOG_FILE << "aggregated " << num_input_rows << " input rows into "
             << hash_tbl_->size() << " output rows";
   return Status::OK;
 }


 // Streams aggregated rows from the hash table into 'row_batch'.
 //
 // Each remaining hash table entry is finalized (or serialized) into an output tuple,
 // evaluated against this node's conjuncts, and committed to the batch if it passes.
 // Stops when the batch is at capacity, the hash table is exhausted or the row limit is
 // reached. '*eos' is set to true once the iterator is at its end or the limit has been
 // hit. Returns a non-OK status on cancellation or if query maintenance or the debug
 // action fails.
 Status AggregationNode::GetNext(RuntimeState* state, RowBatch* row_batch, bool* eos) {
   SCOPED_TIMER(runtime_profile_->total_time_counter());
   RETURN_IF_ERROR(ExecDebugAction(TExecNodePhase::GETNEXT, state));
   RETURN_IF_CANCELLED(state);
   RETURN_IF_ERROR(QueryMaintenance(state));
   SCOPED_TIMER(get_results_timer_);

   if (ReachedLimit()) {
     *eos = true;
     return Status::OK;
   }
   *eos = false;
   // Indexing element 0 of an empty vector is undefined behavior, so pass a NULL array
   // when there are no conjuncts. EvalConjuncts() is told num_ctxs == 0 in that case and
   // therefore has no entries to visit.
   ExprContext** ctxs = conjunct_ctxs_.empty() ? NULL : &conjunct_ctxs_[0];
   int num_ctxs = conjunct_ctxs_.size();

   int count = 0;
   const int N = state->batch_size();
   while (!output_iterator_.AtEnd() && !row_batch->AtCapacity()) {
     // This loop can go on for a long time if the conjuncts are very selective. Do query
     // maintenance every N iterations.
     if (count++ % N == 0) {
       RETURN_IF_CANCELLED(state);
       RETURN_IF_ERROR(QueryMaintenance(state));
     }
     int row_idx = row_batch->AddRow();
     TupleRow* row = row_batch->GetRow(row_idx);
     Tuple* intermediate_tuple = output_iterator_.GetTuple();
     // Any separate output tuple is allocated from the batch's own tuple data pool.
     Tuple* output_tuple =
         FinalizeTuple(intermediate_tuple, row_batch->tuple_data_pool());
     output_iterator_.Next<false>();
     row->SetTuple(0, output_tuple);
     // Rows that fail the conjuncts are simply not committed; the slot returned by
     // AddRow() is reused on the next iteration.
     if (ExecNode::EvalConjuncts(ctxs, num_ctxs, row)) {
       VLOG_ROW << "output row: " << PrintRow(row, row_desc());
       row_batch->CommitLastRow();
       ++num_rows_returned_;
       if (ReachedLimit()) break;
     }
   }
   *eos = output_iterator_.AtEnd() || ReachedLimit();
   COUNTER_SET(rows_returned_counter_, num_rows_returned_);
   return Status::OK;
 }


 // Resetting an aggregation node is not yet implemented ("NYI"): the DCHECK flags any
 // call, and the caller receives an error status carrying the same text.
 Status AggregationNode::Reset(RuntimeState* state) {
   const string not_implemented("NYI");
   DCHECK(false) << not_implemented;
   return Status(not_implemented);
 }


 // Releases everything this node owns. Safe to call more than once (later calls return
 // immediately) and after a Prepare() that failed part-way: every member that Prepare()
 // sets up is checked before it is used.
 void AggregationNode::Close(RuntimeState* state) {
   if (is_closed()) return;

   // Iterate through the remaining rows in the hash table and call Serialize/Finalize on
   // them in order to free any memory allocated by UDAs. Finalize() requires a dst tuple
   // but we don't actually need the result, so allocate a single dummy tuple to avoid
   // accumulating memory.
   // output_tuple_desc_ is still NULL if Prepare() failed before looking it up. In that
   // case no hash table was created either, so there is nothing to finalize below.
   Tuple* dummy_dst = NULL;
   if (needs_finalize_ && output_tuple_desc_ != NULL) {
     dummy_dst = Tuple::Create(output_tuple_desc_->byte_size(), tuple_pool_.get());
   }
   while (!output_iterator_.AtEnd()) {
     Tuple* tuple = output_iterator_.GetTuple();
     if (needs_finalize_) {
       AggFnEvaluator::Finalize(aggregate_evaluators_, agg_fn_ctxs_, tuple, dummy_dst);
     } else {
       AggFnEvaluator::Serialize(aggregate_evaluators_, agg_fn_ctxs_, tuple);
     }
     output_iterator_.Next<false>();
   }

   if (tuple_pool_.get() != NULL) tuple_pool_->FreeAll();
   if (hash_tbl_.get() != NULL) hash_tbl_->Close();

   DCHECK(agg_fn_ctxs_.empty() || aggregate_evaluators_.size() == agg_fn_ctxs_.size());
   for (int i = 0; i < aggregate_evaluators_.size(); ++i) {
     aggregate_evaluators_[i]->Close(state);
     // agg_fn_ctxs_ is resized up front in Prepare() and filled in one evaluator at a
     // time, so entries after a failed evaluator Prepare() are still NULL.
     if (!agg_fn_ctxs_.empty() && agg_fn_ctxs_[i] != NULL) {
       agg_fn_ctxs_[i]->impl()->Close();
     }
   }
   if (agg_fn_pool_.get() != NULL) agg_fn_pool_->FreeAll();

   Expr::Close(probe_expr_ctxs_, state);
   Expr::Close(build_expr_ctxs_, state);
   ExecNode::Close(state);
 }


 // Allocates a new intermediate tuple from tuple_pool_ and initializes it:
 //  - the grouping slots receive the values (or NULLs) most recently evaluated by the
 //    hash table, and
 //  - every aggregate slot is initialized through its evaluator, after which MIN/MAX
 //    slots of supported types are seeded with the type's max/min value.
 // Returns the new tuple.
 Tuple* AggregationNode::ConstructIntermediateTuple() {
   Tuple* new_tuple = Tuple::Create(
       intermediate_tuple_desc_->byte_size(), tuple_pool_.get());
   const vector<SlotDescriptor*>& slots = intermediate_tuple_desc_->slots();
   // Position in 'slots'; shared by both loops because the aggregate slots follow the
   // grouping slots.
   int slot_idx = 0;

   // Grouping values come first, one slot per probe expr.
   for (int expr_idx = 0; expr_idx < probe_expr_ctxs_.size(); ++expr_idx, ++slot_idx) {
     SlotDescriptor* grouping_slot = slots[slot_idx];
     if (!hash_tbl_->last_expr_value_null(expr_idx)) {
       void* src = hash_tbl_->last_expr_value(expr_idx);
       void* dst = new_tuple->GetSlot(grouping_slot->tuple_offset());
       RawValue::Write(src, dst, grouping_slot->type(), tuple_pool_.get());
     } else {
       new_tuple->SetNull(grouping_slot->null_indicator_offset());
     }
   }

   // Then the aggregate outputs, one materialized slot per evaluator.
   for (int agg_idx = 0; agg_idx < aggregate_evaluators_.size(); ++agg_idx, ++slot_idx) {
     while (!slots[slot_idx]->is_materialized()) ++slot_idx;
     SlotDescriptor* agg_slot = slots[slot_idx];
     AggFnEvaluator* evaluator = aggregate_evaluators_[agg_idx];
     evaluator->Init(agg_fn_ctxs_[agg_idx], new_tuple);

     // Codegen specific path.
     // Seeding the slot spares UpdateTuple a null check on the aggregation dst slot:
     //  - sum/count: 0
     //  - min: max_value
     //  - max: min_value
     // TODO: remove when we don't use the irbuilder for codegen here.
     // This optimization no longer applies with AnyVal
     bool type_can_be_seeded;
     switch (agg_slot->type().type) {
       case TYPE_STRING:
       case TYPE_VARCHAR:
       case TYPE_TIMESTAMP:
       case TYPE_CHAR:
       case TYPE_DECIMAL:
         type_can_be_seeded = false;
         break;
       default:
         type_can_be_seeded = true;
         break;
     }
     if (!type_can_be_seeded) continue;

     ExprValue default_value;
     void* default_value_ptr = NULL;
     bool write_default = true;
     switch (evaluator->agg_op()) {
       case AggFnEvaluator::MIN:
         default_value_ptr = default_value.SetToMax(agg_slot->type());
         break;
       case AggFnEvaluator::MAX:
         default_value_ptr = default_value.SetToMin(agg_slot->type());
         break;
       default:
         write_default = false;
         break;
     }
     if (write_default) {
       RawValue::Write(default_value_ptr, new_tuple, agg_slot, NULL);
     }
   }
   return new_tuple;
 }


 // Folds one input 'row' into the intermediate 'tuple' by handing both to
 // AggFnEvaluator::Add() together with all of this node's evaluators and their function
 // contexts. 'tuple' may only be NULL when the node has no aggregate evaluators.
 void AggregationNode::UpdateTuple(Tuple* tuple, TupleRow* row) {
   DCHECK(tuple != NULL || aggregate_evaluators_.empty());
   AggFnEvaluator::Add(aggregate_evaluators_, agg_fn_ctxs_, row, tuple);
 }


 // Produces the output form of the intermediate 'tuple' and returns it.
 //
 // Without finalization the tuple is serialized and returned as is. With finalization
 // the evaluators are finalized into 'dst', which is a fresh tuple allocated from
 // 'pool' when the intermediate and output tuple ids differ and 'tuple' itself
 // otherwise. When a separate 'dst' was allocated, the grouping slots are copied over
 // from 'tuple' as well.
 Tuple* AggregationNode::FinalizeTuple(Tuple* tuple, MemPool* pool) {
   DCHECK(tuple != NULL || aggregate_evaluators_.empty());

   if (!needs_finalize_) {
     AggFnEvaluator::Serialize(aggregate_evaluators_, agg_fn_ctxs_, tuple);
     return tuple;
   }

   Tuple* dst = tuple;
   if (intermediate_tuple_id_ != output_tuple_id_) {
     dst = Tuple::Create(output_tuple_desc_->byte_size(), pool);
   }
   AggFnEvaluator::Finalize(aggregate_evaluators_, agg_fn_ctxs_, tuple, dst);
   if (dst == tuple) return dst;

   // Copy the grouping values into the separate output tuple; a NULL source pointer
   // stands for a NULL grouping value.
   // TODO: Codegen this.
   const int num_grouping_slots = probe_expr_ctxs_.size();
   for (int slot_idx = 0; slot_idx < num_grouping_slots; ++slot_idx) {
     SlotDescriptor* from_desc = intermediate_tuple_desc_->slots()[slot_idx];
     SlotDescriptor* to_desc = output_tuple_desc_->slots()[slot_idx];
     void* value = NULL;
     if (!tuple->IsNull(from_desc->null_indicator_offset())) {
       value = tuple->GetSlot(from_desc->tuple_offset());
     }
     RawValue::Write(value, dst, to_desc, NULL);
   }
   return dst;
 }


 void AggregationNode::DebugString(int indentation_level, stringstream* out) const {

   *out << string(indentation_level * 2, ' ');

   *out << "AggregationNode("

        << "intermediate_tuple_id=" << intermediate_tuple_id_

        << " output_tuple_id=" << output_tuple_id_

        << " needs_finalize=" << needs_finalize_

        << " probe_exprs=" << Expr::DebugString(probe_expr_ctxs_)

        << " agg_exprs=" << AggFnEvaluator::DebugString(aggregate_evaluators_);

   ExecNode::DebugString(indentation_level, out);

   *out << ")";

 }


 // Maps the type of an NDV input expr to the IR function that updates a HLL
 // intermediate value with an input of that type. Unsupported types trip a DCHECK and
 // yield IRFunction::FN_END.
 IRFunction::Type GetHllUpdateFunction2(const ColumnType& type) {
   IRFunction::Type hll_update_fn = IRFunction::FN_END;
   switch (type.type) {
     case TYPE_BOOLEAN:
       hll_update_fn = IRFunction::HLL_UPDATE_BOOLEAN;
       break;
     case TYPE_TINYINT:
       hll_update_fn = IRFunction::HLL_UPDATE_TINYINT;
       break;
     case TYPE_SMALLINT:
       hll_update_fn = IRFunction::HLL_UPDATE_SMALLINT;
       break;
     case TYPE_INT:
       hll_update_fn = IRFunction::HLL_UPDATE_INT;
       break;
     case TYPE_BIGINT:
       hll_update_fn = IRFunction::HLL_UPDATE_BIGINT;
       break;
     case TYPE_FLOAT:
       hll_update_fn = IRFunction::HLL_UPDATE_FLOAT;
       break;
     case TYPE_DOUBLE:
       hll_update_fn = IRFunction::HLL_UPDATE_DOUBLE;
       break;
     case TYPE_STRING:
       hll_update_fn = IRFunction::HLL_UPDATE_STRING;
       break;
     case TYPE_DECIMAL:
       hll_update_fn = IRFunction::HLL_UPDATE_DECIMAL;
       break;
     default:
       DCHECK(false) << "Unsupported type: " << type;
       break;
   }
   return hll_update_fn;
 }


 // IR Generation for updating a single aggregation slot. Signature is:

 // void UpdateSlot(FunctionContext* fn_ctx, AggTuple* agg_tuple, char** row)

 //

 // The IR for sum(double_col) is:

 // define void @UpdateSlot(%"class.impala_udf::FunctionContext"* %fn_ctx,

 //                         { i8, double }* %agg_tuple,

 //                         %"class.impala::TupleRow"* %row) #20 {

 // entry:

 //   %src = call { i8, double } @GetSlotRef(%"class.impala::ExprContext"* inttoptr

 //     (i64 128241264 to %"class.impala::ExprContext"*), %"class.impala::TupleRow"* %row)

 //   %0 = extractvalue { i8, double } %src, 0

 //   %is_null = trunc i8 %0 to i1

 //   br i1 %is_null, label %ret, label %src_not_null

 //

 // src_not_null:                                     ; preds = %entry

 //   %dst_slot_ptr = getelementptr inbounds { i8, double }* %agg_tuple, i32 0, i32 1

 //   call void @SetNotNull({ i8, double }* %agg_tuple)

 //   %dst_val = load double* %dst_slot_ptr

 //   %val = extractvalue { i8, double } %src, 1

 //   %1 = fadd double %dst_val, %val

 //   store double %1, double* %dst_slot_ptr

 //   br label %ret

 //

 // ret:                                              ; preds = %src_not_null, %entry

 //   ret void

 // }

 //

 // The IR for ndv(double_col) is:

 // define void @UpdateSlot(%"class.impala_udf::FunctionContext"* %fn_ctx,

 //                         { i8, %"struct.impala::StringValue" }* %agg_tuple,

 //                         %"class.impala::TupleRow"* %row) #20 {

 // entry:

 //   %dst_lowered_ptr = alloca { i64, i8* }

 //   %src_lowered_ptr = alloca { i8, double }

 //   %src = call { i8, double } @GetSlotRef(%"class.impala::ExprContext"* inttoptr

 //     (i64 120530832 to %"class.impala::ExprContext"*), %"class.impala::TupleRow"* %row)

 //   %0 = extractvalue { i8, double } %src, 0

 //   %is_null = trunc i8 %0 to i1

 //   br i1 %is_null, label %ret, label %src_not_null

 //

 // src_not_null:                                     ; preds = %entry

 //   %dst_slot_ptr = getelementptr inbounds

 //     { i8, %"struct.impala::StringValue" }* %agg_tuple, i32 0, i32 1

 //   call void @SetNotNull({ i8, %"struct.impala::StringValue" }* %agg_tuple)

 //   %dst_val = load %"struct.impala::StringValue"* %dst_slot_ptr

 //   store { i8, double } %src, { i8, double }* %src_lowered_ptr

 //   %src_unlowered_ptr = bitcast { i8, double }* %src_lowered_ptr

 //                        to %"struct.impala_udf::DoubleVal"*

 //   %ptr = extractvalue %"struct.impala::StringValue" %dst_val, 0

 //   %dst_stringval = insertvalue { i64, i8* } zeroinitializer, i8* %ptr, 1

 //   %len = extractvalue %"struct.impala::StringValue" %dst_val, 1

 //   %1 = extractvalue { i64, i8* } %dst_stringval, 0

 //   %2 = zext i32 %len to i64

 //   %3 = shl i64 %2, 32

 //   %4 = and i64 %1, 4294967295

 //   %5 = or i64 %4, %3

 //   %dst_stringval1 = insertvalue { i64, i8* } %dst_stringval, i64 %5, 0

 //   store { i64, i8* } %dst_stringval1, { i64, i8* }* %dst_lowered_ptr

 //   %dst_unlowered_ptr = bitcast { i64, i8* }* %dst_lowered_ptr

 //                        to %"struct.impala_udf::StringVal"*

 //   call void @HllUpdate(%"class.impala_udf::FunctionContext"* %fn_ctx,

 //                        %"struct.impala_udf::DoubleVal"* %src_unlowered_ptr,

 //                        %"struct.impala_udf::StringVal"* %dst_unlowered_ptr)

 //   %anyval_result = load { i64, i8* }* %dst_lowered_ptr

 //   %6 = extractvalue { i64, i8* } %anyval_result, 1

 //   %7 = insertvalue %"struct.impala::StringValue" zeroinitializer, i8* %6, 0

 //   %8 = extractvalue { i64, i8* } %anyval_result, 0

 //   %9 = ashr i64 %8, 32

 //   %10 = trunc i64 %9 to i32

 //   %11 = insertvalue %"struct.impala::StringValue" %7, i32 %10, 1

 //   store %"struct.impala::StringValue" %11, %"struct.impala::StringValue"* %dst_slot_ptr

 //   br label %ret

 //

 // ret:                                              ; preds = %src_not_null, %entry

 //   ret void

 // }

 // Generates the IR function "UpdateSlot" that applies one input row to the single
 // aggregate slot 'slot_desc' of the intermediate tuple, using the aggregate operator of
 // 'evaluator'. The evaluator must have exactly one input expr and 'slot_desc' must be
 // materialized.
 //
 // Returns the finalized function, or NULL if the codegen object is unavailable, the
 // input expr is a TIMESTAMP, or the input expr's compute function cannot be codegen'd.
 llvm::Function* AggregationNode::CodegenUpdateSlot(
     RuntimeState* state, AggFnEvaluator* evaluator, SlotDescriptor* slot_desc) {
   DCHECK(slot_desc->is_materialized());
   LlvmCodeGen* codegen;
   if (!state->GetCodegen(&codegen).ok()) return NULL;

   DCHECK_EQ(evaluator->input_expr_ctxs().size(), 1);
   ExprContext* input_expr_ctx = evaluator->input_expr_ctxs()[0];
   Expr* input_expr = input_expr_ctx->root();
   // TODO: implement timestamp
   if (input_expr->type().type == TYPE_TIMESTAMP) return NULL;
   // Codegen the function that evaluates the input expr for a row.
   Function* agg_expr_fn;
   Status status = input_expr->GetCodegendComputeFn(state, &agg_expr_fn);
   if (!status.ok()) {
     VLOG_QUERY << "Could not codegen UpdateSlot(): " << status.GetDetail();
     return NULL;
   }
   DCHECK(agg_expr_fn != NULL);

   PointerType* fn_ctx_type =
       codegen->GetPtrType(FunctionContextImpl::LLVM_FUNCTIONCONTEXT_NAME);
   StructType* tuple_struct = intermediate_tuple_desc_->GenerateLlvmStruct(codegen);
   PointerType* tuple_ptr_type = PointerType::get(tuple_struct, 0);
   PointerType* tuple_row_ptr_type = codegen->GetPtrType(TupleRow::LLVM_CLASS_NAME);

   // Create UpdateSlot prototype
   LlvmCodeGen::FnPrototype prototype(codegen, "UpdateSlot", codegen->void_type());
   prototype.AddArgument(LlvmCodeGen::NamedVariable("fn_ctx", fn_ctx_type));
   prototype.AddArgument(LlvmCodeGen::NamedVariable("agg_tuple", tuple_ptr_type));
   prototype.AddArgument(LlvmCodeGen::NamedVariable("row", tuple_row_ptr_type));

   LlvmCodeGen::LlvmBuilder builder(codegen->context());
   Value* args[3];
   Function* fn = prototype.GeneratePrototype(&builder, &args[0]);
   Value* fn_ctx_arg = args[0];
   Value* agg_tuple_arg = args[1];
   Value* row_arg = args[2];

   // Two blocks besides the entry block: one that performs the update and the common
   // exit.
   BasicBlock* src_not_null_block =
       BasicBlock::Create(codegen->context(), "src_not_null", fn);
   BasicBlock* ret_block = BasicBlock::Create(codegen->context(), "ret", fn);

   // Call expr function to get src slot value
   Value* ctx_arg = codegen->CastPtrToLlvmPtr(
       codegen->GetPtrType(ExprContext::LLVM_CLASS_NAME), input_expr_ctx);
   Value* agg_expr_fn_args[] = { ctx_arg, row_arg };
   CodegenAnyVal src = CodegenAnyVal::CreateCallWrapped(
       codegen, &builder, input_expr->type(), agg_expr_fn, agg_expr_fn_args, "src");

   // A NULL input leaves the slot untouched: branch straight to the exit block.
   Value* src_is_null = src.GetIsNull();
   builder.CreateCondBr(src_is_null, ret_block, src_not_null_block);

   // Src slot is not null, update dst_slot
   builder.SetInsertPoint(src_not_null_block);
   Value* dst_ptr =
       builder.CreateStructGEP(agg_tuple_arg, slot_desc->field_idx(), "dst_slot_ptr");
   Value* result = NULL;

   if (slot_desc->is_nullable()) {
     // The slot is about to receive a non-NULL value, so clear its null bit. The slot
     // value itself is written by the store at the end of this block.
     Function* clear_null_fn = slot_desc->CodegenUpdateNull(codegen, tuple_struct, false);
     builder.CreateCall(clear_null_fn, agg_tuple_arg);
   }

   // Update the slot
   Value* dst_value = builder.CreateLoad(dst_ptr, "dst_val");
   switch (evaluator->agg_op()) {
     case AggFnEvaluator::COUNT:
       // A merge adds the incoming partial count; otherwise each non-NULL input counts
       // as one.
       if (evaluator->is_merge()) {
         result = builder.CreateAdd(dst_value, src.GetVal(), "count_sum");
       } else {
         result = builder.CreateAdd(dst_value,
             codegen->GetIntConstant(TYPE_BIGINT, 1), "count_inc");
       }
       break;
     case AggFnEvaluator::MIN: {
       Function* min_fn = codegen->CodegenMinMax(slot_desc->type(), true);
       Value* min_args[] = { dst_value, src.GetVal() };
       result = builder.CreateCall(min_fn, min_args, "min_value");
       break;
     }
     case AggFnEvaluator::MAX: {
       Function* max_fn = codegen->CodegenMinMax(slot_desc->type(), false);
       Value* max_args[] = { dst_value, src.GetVal() };
       result = builder.CreateCall(max_fn, max_args, "max_value");
       break;
     }
     case AggFnEvaluator::SUM:
       // Floating point slots need the floating point add instruction.
       if (slot_desc->type().type == TYPE_FLOAT || slot_desc->type().type == TYPE_DOUBLE) {
         result = builder.CreateFAdd(dst_value, src.GetVal());
       } else {
         result = builder.CreateAdd(dst_value, src.GetVal());
       }
       break;
     case AggFnEvaluator::NDV: {
       DCHECK_EQ(slot_desc->type().type, TYPE_STRING);
       // Merges use the HLL merge function; updates use the function matching the input
       // type.
       IRFunction::Type ir_function_type = evaluator->is_merge() ? IRFunction::HLL_MERGE
                                           : GetHllUpdateFunction2(input_expr->type());
       Function* hll_fn = codegen->GetFunction(ir_function_type);

       // Create pointer to src_anyval to pass to HllUpdate() function. We must use the
       // unlowered type.
       Value* src_lowered_ptr = codegen->CreateEntryBlockAlloca(
           fn, LlvmCodeGen::NamedVariable("src_lowered_ptr", src.value()->getType()));
       builder.CreateStore(src.value(), src_lowered_ptr);
       Type* unlowered_ptr_type =
           CodegenAnyVal::GetUnloweredType(codegen, input_expr->type())->getPointerTo();
       Value* src_unlowered_ptr =
           builder.CreateBitCast(src_lowered_ptr, unlowered_ptr_type, "src_unlowered_ptr");

       // Create StringVal* intermediate argument from dst_value
       CodegenAnyVal dst_stringval = CodegenAnyVal::GetNonNullVal(
           codegen, &builder, TYPE_STRING, "dst_stringval");
       dst_stringval.SetFromRawValue(dst_value);
       // Create pointer to dst_stringval to pass to HllUpdate() function. We must use
       // the unlowered type.
       Value* dst_lowered_ptr = codegen->CreateEntryBlockAlloca(
           fn, LlvmCodeGen::NamedVariable("dst_lowered_ptr",
                                          dst_stringval.value()->getType()));
       builder.CreateStore(dst_stringval.value(), dst_lowered_ptr);
       unlowered_ptr_type =
           codegen->GetPtrType(CodegenAnyVal::GetUnloweredType(codegen, TYPE_STRING));
       Value* dst_unlowered_ptr =
           builder.CreateBitCast(dst_lowered_ptr, unlowered_ptr_type, "dst_unlowered_ptr");

       // Call 'hll_fn'
       builder.CreateCall3(hll_fn, fn_ctx_arg, src_unlowered_ptr, dst_unlowered_ptr);

       // Convert the StringVal intermediate (read back through 'dst_lowered_ptr') to a
       // StringValue that can be stored in the slot.
       Value* anyval_result = builder.CreateLoad(dst_lowered_ptr, "anyval_result");
       result = CodegenAnyVal(codegen, &builder, TYPE_STRING, anyval_result)
                .ToNativeValue();
       break;
     }
     default:
       // NOTE(review): if DCHECK is compiled out, 'result' is still NULL when it reaches
       // the CreateStore() below — confirm callers never pass another aggregate op.
       DCHECK(false) << "bad aggregate operator: " << evaluator->agg_op();
   }

   // Write the new value back to the slot and fall through to the exit block.
   builder.CreateStore(result, dst_ptr);
   builder.CreateBr(ret_block);

   builder.SetInsertPoint(ret_block);
   builder.CreateRetVoid();

   return codegen->FinalizeFunction(fn);
 }


 // IR codegen for the UpdateTuple loop.  This loop is query specific and

 // based on the aggregate functions.  The function signature must match the non-

 // codegen'd UpdateTuple exactly.

 // For the query:

 // select count(*), count(int_col), sum(double_col) the IR looks like:

 //

 // define void @UpdateTuple(%"class.impala::AggregationNode"* %this_ptr,

 //                          %"class.impala::Tuple"* %agg_tuple,

 //                          %"class.impala::TupleRow"* %tuple_row) #20 {

 // entry:

 //   %tuple = bitcast %"class.impala::Tuple"* %agg_tuple to { i8, i64, i64, double }*

 //   %src_slot = getelementptr inbounds { i8, i64, i64, double }* %tuple, i32 0, i32 1

 //   %count_star_val = load i64* %src_slot

 //   %count_star_inc = add i64 %count_star_val, 1

 //   store i64 %count_star_inc, i64* %src_slot

 //   call void @UpdateSlot(%"class.impala_udf::FunctionContext"* inttoptr

 //                           (i64 44521296 to %"class.impala_udf::FunctionContext"*),

 //                         { i8, i64, i64, double }* %tuple,

 //                         %"class.impala::TupleRow"* %tuple_row)

 //   call void @UpdateSlot5(%"class.impala_udf::FunctionContext"* inttoptr

 //                            (i64 44521328 to %"class.impala_udf::FunctionContext"*),

 //                          { i8, i64, i64, double }* %tuple,

 //                          %"class.impala::TupleRow"* %tuple_row)

 //   ret void

 // }

 Function* AggregationNode::CodegenUpdateTuple(RuntimeState* state) {

   LlvmCodeGen* codegen;

   if (!state->GetCodegen(&codegen).ok()) return NULL;

   SCOPED_TIMER(codegen->codegen_timer());


   int j = probe_expr_ctxs_.size();

   for (int i = 0; i < aggregate_evaluators_.size(); ++i, ++j) {

     // skip non-materialized slots; we don't have evaluators instantiated for those

     while (!intermediate_tuple_desc_->slots()[j]->is_materialized()) {

       DCHECK_LT(j, intermediate_tuple_desc_->slots().size() - 1);

       ++j;

     }

     SlotDescriptor* slot_desc = intermediate_tuple_desc_->slots()[j];

     AggFnEvaluator* evaluator = aggregate_evaluators_[i];


     // Timestamp and char are never supported. NDV supports decimal and string but no

     // other functions.

     // TODO: the other aggregate functions might work with decimal as-is

     if (slot_desc->type().type == TYPE_TIMESTAMP || slot_desc->type().type == TYPE_CHAR ||

         (evaluator->agg_op() != AggFnEvaluator::NDV &&

          (slot_desc->type().type == TYPE_DECIMAL ||

           slot_desc->type().type == TYPE_STRING ||

           slot_desc->type().type == TYPE_VARCHAR))) {

       VLOG_QUERY << "Could not codegen UpdateIntermediateTuple because "

                  << "string, char, timestamp and decimal are not yet supported.";

       return NULL;

     }


     // Don't codegen things that aren't builtins (for now)

     if (!evaluator->is_builtin()) return NULL;

   }


   if (intermediate_tuple_desc_->GenerateLlvmStruct(codegen) == NULL) {

     VLOG_QUERY << "Could not codegen UpdateTuple because we could"

                << "not generate a matching llvm struct for the intermediate tuple.";

     return NULL;

   }


   // Get the types to match the UpdateTuple signature

   Type* agg_node_type = codegen->GetType(AggregationNode::LLVM_CLASS_NAME);

   Type* agg_tuple_type = codegen->GetType(Tuple::LLVM_CLASS_NAME);

   Type* tuple_row_type = codegen->GetType(TupleRow::LLVM_CLASS_NAME);


   DCHECK(agg_node_type != NULL);

   DCHECK(agg_tuple_type != NULL);

   DCHECK(tuple_row_type != NULL);


   PointerType* agg_node_ptr_type = PointerType::get(agg_node_type, 0);

   PointerType* agg_tuple_ptr_type = PointerType::get(agg_tuple_type, 0);

   PointerType* tuple_row_ptr_type = PointerType::get(tuple_row_type, 0);


   // Signature for UpdateTuple is

   // void UpdateTuple(AggregationNode* this, Tuple* tuple, TupleRow* row)

   // This signature needs to match the non-codegen'd signature exactly.

   StructType* tuple_struct = intermediate_tuple_desc_->GenerateLlvmStruct(codegen);

   PointerType* tuple_ptr = PointerType::get(tuple_struct, 0);

   LlvmCodeGen::FnPrototype prototype(codegen, "UpdateTuple", codegen->void_type());

   prototype.AddArgument(LlvmCodeGen::NamedVariable("this_ptr", agg_node_ptr_type));

   prototype.AddArgument(LlvmCodeGen::NamedVariable("agg_tuple", agg_tuple_ptr_type));

   prototype.AddArgument(LlvmCodeGen::NamedVariable("tuple_row", tuple_row_ptr_type));


   LlvmCodeGen::LlvmBuilder builder(codegen->context());

   Value* args[3];

   Function* fn = prototype.GeneratePrototype(&builder, &args[0]);


   // Cast the parameter types to the internal llvm runtime types.

   // TODO: get rid of this by using right type in function signature

   args[1] = builder.CreateBitCast(args[1], tuple_ptr, "tuple");


   // Loop over each expr and generate the IR for that slot.  If the expr is not

   // count(*), generate a helper IR function to update the slot and call that.

   j = probe_expr_ctxs_.size();

   for (int i = 0; i < aggregate_evaluators_.size(); ++i, ++j) {

     // skip non-materialized slots; we don't have evaluators instantiated for those

     while (!intermediate_tuple_desc_->slots()[j]->is_materialized()) {

       DCHECK_LT(j, intermediate_tuple_desc_->slots().size() - 1);

       ++j;

     }

     SlotDescriptor* slot_desc = intermediate_tuple_desc_->slots()[j];

     AggFnEvaluator* evaluator = aggregate_evaluators_[i];

     if (evaluator->is_count_star()) {

       // TODO: we should be able to hoist this up to the loop over the batch and just

       // increment the slot by the number of rows in the batch.

       int field_idx = slot_desc->field_idx();

       Value* const_one = codegen->GetIntConstant(TYPE_BIGINT, 1);

       Value* slot_ptr = builder.CreateStructGEP(args[1], field_idx, "src_slot");

       Value* slot_loaded = builder.CreateLoad(slot_ptr, "count_star_val");

       Value* count_inc = builder.CreateAdd(slot_loaded, const_one, "count_star_inc");

       builder.CreateStore(count_inc, slot_ptr);

     } else {

       Function* update_slot_fn = CodegenUpdateSlot(state, evaluator, slot_desc);

       if (update_slot_fn == NULL) return NULL;

       Value* fn_ctx_arg = codegen->CastPtrToLlvmPtr(

           codegen->GetPtrType(FunctionContextImpl::LLVM_FUNCTIONCONTEXT_NAME),

           agg_fn_ctxs_[i]);

       builder.CreateCall3(update_slot_fn, fn_ctx_arg, args[1], args[2]);

     }

   }

   builder.CreateRetVoid();


   // CodegenProcessRowBatch() does the final optimizations.

   return codegen->FinalizeFunction(fn);

 }


 // Produces the IR for ProcessRowBatch with its call sites bound to codegen'd
 // functions. 'update_tuple_fn' must be non-NULL; it replaces the "UpdateTuple"
 // call site. When there are grouping exprs (probe_expr_ctxs_ is non-empty), the
 // hash table's "EvalBuildRow", "EvalProbeRow", "HashCurrentRow" and "Equals" call
 // sites are replaced as well.
 // Returns NULL if the codegen object cannot be obtained, if the cross compiled
 // function is not found, or if any of the hash table functions fails to codegen.
 // Otherwise returns the result of OptimizeFunctionWithExprs().
 Function* AggregationNode::CodegenProcessRowBatch(
     RuntimeState* state, Function* update_tuple_fn) {
   LlvmCodeGen* codegen;
   if (!state->GetCodegen(&codegen).ok()) return NULL;
   SCOPED_TIMER(codegen->codegen_timer());
   DCHECK(update_tuple_fn != NULL);

   // Pick the cross compiled batch function: the grouping variant is used iff there
   // are probe exprs.
   const bool has_grouping = !probe_expr_ctxs_.empty();
   IRFunction::Type ir_fn = IRFunction::AGG_NODE_PROCESS_ROW_BATCH_NO_GROUPING;
   if (has_grouping) ir_fn = IRFunction::AGG_NODE_PROCESS_ROW_BATCH_WITH_GROUPING;

   Function* process_batch_fn = codegen->GetFunction(ir_fn);
   if (process_batch_fn == NULL) {
     LOG(ERROR) << "Could not find AggregationNode::ProcessRowBatch in module.";
     return NULL;
   }

   int replaced = 0;
   if (has_grouping) {
     // Only aggregation with grouping uses the hash table. Generate all four hash
     // table functions up front and bail out before touching any call site if one
     // of them cannot be generated.
     Function* hash_row_fn = hash_tbl_->CodegenHashCurrentRow(state);
     if (hash_row_fn == NULL) return NULL;

     Function* rows_equal_fn = hash_tbl_->CodegenEquals(state);
     if (rows_equal_fn == NULL) return NULL;

     Function* build_row_fn = hash_tbl_->CodegenEvalTupleRow(state, true);
     if (build_row_fn == NULL) return NULL;

     Function* probe_row_fn = hash_tbl_->CodegenEvalTupleRow(state, false);
     if (probe_row_fn == NULL) return NULL;

     // Swap in the generated functions. Each DCHECK states how many call sites are
     // expected to be replaced for that name.
     process_batch_fn = codegen->ReplaceCallSites(
         process_batch_fn, false, build_row_fn, "EvalBuildRow", &replaced);
     DCHECK_EQ(replaced, 1);

     process_batch_fn = codegen->ReplaceCallSites(
         process_batch_fn, false, probe_row_fn, "EvalProbeRow", &replaced);
     DCHECK_EQ(replaced, 1);

     process_batch_fn = codegen->ReplaceCallSites(
         process_batch_fn, false, hash_row_fn, "HashCurrentRow", &replaced);
     DCHECK_EQ(replaced, 2);

     process_batch_fn = codegen->ReplaceCallSites(
         process_batch_fn, false, rows_equal_fn, "Equals", &replaced);
     DCHECK_EQ(replaced, 1);
   }

   // Both variants call UpdateTuple; bind it to the codegen'd version.
   process_batch_fn = codegen->ReplaceCallSites(
       process_batch_fn, false, update_tuple_fn, "UpdateTuple", &replaced);
   DCHECK_EQ(replaced, 1) << "One call site should be replaced.";
   DCHECK(process_batch_fn != NULL);

   return codegen->OptimizeFunctionWithExprs(process_batch_fn);
 }


 }

impala::AggregationNode::LLVM_CLASS_NAME
static const char * LLVM_CLASS_NAME
Definition: aggregation-node.h:61

impala::AggregationNode::output_tuple_desc_
TupleDescriptor * output_tuple_desc_
Definition: aggregation-node.h:89

row-batch.h

impala::DescriptorTbl
Definition: descriptors.h:338

impala::CodegenAnyVal::SetFromRawValue
void SetFromRawValue(llvm::Value *raw_val)
Definition: codegen-anyval.cc:458

agg-fn-evaluator.h

impala::AggFnEvaluator::is_builtin
bool is_builtin() const
Definition: agg-fn-evaluator.h:115

impala::ExecNode::AddRuntimeExecOption
void AddRuntimeExecOption(const std::string &option)
Appends option to 'runtime_exec_options_'.
Definition: exec-node.cc:188

impala::TYPE_DOUBLE
Definition: types.h:36

impala::CodegenAnyVal
Definition: codegen-anyval.h:52

impala::Status::GetDetail
const std::string GetDetail() const
Definition: status.cc:184

impala::CodegenAnyVal::CreateCallWrapped
static CodegenAnyVal CreateCallWrapped(LlvmCodeGen *cg, LlvmCodeGen::LlvmBuilder *builder, const ColumnType &type, llvm::Function *fn, llvm::ArrayRef< llvm::Value * > args, const char *name="", llvm::Value *result_ptr=NULL)
Same as above but wraps the result in a CodegenAnyVal.
Definition: codegen-anyval.cc:148

impala::Tuple::SetNull
void SetNull(const NullIndicatorOffset &offset)
Definition: tuple.h:101

impala::LlvmCodeGen::codegen_timer
RuntimeProfile::Counter * codegen_timer()
Definition: llvm-codegen.h:135

impala::LlvmCodeGen::GetPtrType
llvm::PointerType * GetPtrType(llvm::Type *type)
Return a pointer type to 'type'.

runtime-profile.h

impala::TYPE_CHAR
Definition: types.h:47

impala::ExecNode::num_rows_returned_
int64_t num_rows_returned_
Definition: exec-node.h:223

codegen-anyval.h

impala::AggregationNode::Prepare
virtual Status Prepare(RuntimeState *state)
Definition: aggregation-node.cc:85

slot-ref.h

impala::AggregationNode::build_expr_ctxs_
std::vector< ExprContext * > build_expr_ctxs_
Definition: aggregation-node.h:80

impala::AggFnEvaluator::SUM
Definition: agg-fn-evaluator.h:70

impala::ExecNode::mem_tracker
MemTracker * mem_tracker()
Definition: exec-node.h:162

impala::TYPE_VARCHAR
Definition: types.h:48

impala::AggregationNode::CodegenUpdateSlot
llvm::Function * CodegenUpdateSlot(RuntimeState *state, AggFnEvaluator *evaluator, SlotDescriptor *slot_desc)
Definition: aggregation-node.cc:506

impala::AggregationNode::AggregationNode
AggregationNode(ObjectPool *pool, const TPlanNode &tnode, const DescriptorTbl &descs)
Definition: aggregation-node.cc:56

impala::LlvmCodeGen::NamedVariable
Utility struct that wraps a variable name and llvm type.
Definition: llvm-codegen.h:149

impala::ExecNode::runtime_profile_
boost::scoped_ptr< RuntimeProfile > runtime_profile_
Definition: exec-node.h:225

impala::Expr::Open
static Status Open(const std::vector< ExprContext * > &ctxs, RuntimeState *state)
Convenience function for opening multiple expr trees.

impala::AggregationNode::build_timer_
RuntimeProfile::Counter * build_timer_
Time spent processing the child rows.
Definition: aggregation-node.h:111

impala::AggFnEvaluator
Definition: agg-fn-evaluator.h:62

old-hash-table.inline.h

impala::Tuple
A tuple with 0 materialised slots is represented as NULL.
Definition: tuple.h:48

impala::ExprValue::SetToMin
void * SetToMin(const ColumnType &type)
Sets the value for type to min and returns a pointer to the data.
Definition: expr-value.h:103

impala::CodegenAnyVal::GetUnloweredType
static llvm::Type * GetUnloweredType(LlvmCodeGen *cg, const ColumnType &type)
Definition: codegen-anyval.cc:69

RETURN_IF_ERROR
#define RETURN_IF_ERROR(stmt)
some generally useful macros
Definition: status.h:242

raw-value.h

impala::AggFnEvaluator::DebugString
std::string DebugString() const
Definition: agg-fn-evaluator.cc:518

impala::ExecNode::Init
virtual Status Init(const TPlanNode &tnode)
Definition: exec-node.cc:124

impala::AggregationNode::GetNext
virtual Status GetNext(RuntimeState *state, RowBatch *row_batch, bool *eos)
Definition: aggregation-node.cc:230

impala::RowBatch::GetRow
TupleRow * GetRow(int row_idx)
Definition: row-batch.h:140

impala::OldHashTable::Iterator::AtEnd
bool AtEnd() const
Returns true if this iterator is at the end, i.e. GetRow() cannot be called.
Definition: old-hash-table.h:293

impala::ExprValue
The materialized value returned by ExprContext::GetValue().
Definition: expr-value.h:25

impala::ExprContext
Definition: expr-context.h:40

ADD_TIMER
#define ADD_TIMER(profile, name)
Definition: runtime-profile.h:50

impala::AggregationNode::intermediate_tuple_id_
TupleId intermediate_tuple_id_
Tuple into which Update()/Merge()/Serialize() results are stored.
Definition: aggregation-node.h:83

expr-context.h

impala::RowBatch::AtCapacity
bool AtCapacity()
Definition: row-batch.h:120

impala::CodegenAnyVal::ToNativeValue
llvm::Value * ToNativeValue()
Definition: codegen-anyval.cc:507

impala::Tuple::GetSlot
void * GetSlot(int offset)
Definition: tuple.h:118

impala::AggFnEvaluator::is_count_star
bool is_count_star() const
Definition: agg-fn-evaluator.h:114

impala::AggFnEvaluator::NDV
Definition: agg-fn-evaluator.h:72

impala::RowDescriptor
Definition: descriptors.h:373

impala::TupleDescriptor::slots
const std::vector< SlotDescriptor * > & slots() const
Definition: descriptors.h:302

impala::TupleDescriptor::byte_size
int byte_size() const
Definition: descriptors.h:300

impala::ObjectPool
Definition: object-pool.h:30

llvm::IRBuilder
Definition: llvm-codegen.h:60

impala::AggFnEvaluator::MAX
Definition: agg-fn-evaluator.h:69

impala::AggFnEvaluator::Add
void Add(FunctionContext *agg_fn_ctx, TupleRow *src, Tuple *dst)
Definition: agg-fn-evaluator.h:238

impala::SlotDescriptor
Definition: descriptors.h:75

impala::AggFnEvaluator::is_merge
bool is_merge() const
Definition: agg-fn-evaluator.h:111

impala::AggFnEvaluator::Create
static Status Create(ObjectPool *pool, const TExpr &desc, AggFnEvaluator **result)
Definition: agg-fn-evaluator.cc:64

impala::TupleDescriptor::GenerateLlvmStruct
llvm::StructType * GenerateLlvmStruct(LlvmCodeGen *codegen)
Definition: descriptors.cc:556

impala::ExecNode::row_desc
const RowDescriptor & row_desc() const
Definition: exec-node.h:156

impala::Tuple::Create
static Tuple * Create(int size, MemPool *pool)
initialize individual tuple with data residing in mem pool
Definition: tuple.h:51

llvm-codegen.h

impala::TupleRow
Definition: tuple-row.h:28

impala::SlotDescriptor::null_indicator_offset
const NullIndicatorOffset & null_indicator_offset() const
Definition: descriptors.h:89

impala::ExecNode::ExecDebugAction
Status ExecDebugAction(TExecNodePhase::type phase, RuntimeState *state)
Definition: exec-node.cc:378

impala::ExecNode::ReachedLimit
bool ReachedLimit()
Definition: exec-node.h:159

impala::TYPE_TIMESTAMP
Definition: types.h:37

impala::AggregationNode::ConstructIntermediateTuple
Tuple * ConstructIntermediateTuple()
Definition: aggregation-node.cc:314

impala::ExprValue::SetToMax
void * SetToMax(const ColumnType &type)
Sets the value for type to max and returns a pointer to the data.
Definition: expr-value.h:137

impala::AggFnEvaluator::agg_op
AggregationOp agg_op() const
Definition: agg-fn-evaluator.h:112

impala::DescriptorTbl::GetTupleDescriptor
TupleDescriptor * GetTupleDescriptor(TupleId id) const
Definition: descriptors.cc:437

SCOPED_TIMER
#define SCOPED_TIMER(c)
Definition: runtime-profile.h:53

impala::CodegenAnyVal::GetNonNullVal
static CodegenAnyVal GetNonNullVal(LlvmCodeGen *codegen, LlvmCodeGen::LlvmBuilder *builder, const ColumnType &type, const char *name="")
Definition: codegen-anyval.cc:674

impala::AggregationNode::singleton_intermediate_tuple_
Tuple * singleton_intermediate_tuple_
Definition: aggregation-node.h:93

impala::Expr::Close
static void Close(const std::vector< ExprContext * > &ctxs, RuntimeState *state)
Convenience function for closing multiple expr trees.

impala::Tuple::IsNull
bool IsNull(const NullIndicatorOffset &offset) const
Definition: tuple.h:112

impala::AggregationNode::Reset
virtual Status Reset(RuntimeState *state)
Definition: aggregation-node.cc:273

impala::LlvmCodeGen
LLVM code generator. This is the top level object to generate jitted code.
Definition: llvm-codegen.h:107

impala::AggregationNode::CodegenUpdateTuple
llvm::Function * CodegenUpdateTuple(RuntimeState *state)
Codegen UpdateTuple(). Returns NULL if codegen is unsuccessful.
Definition: aggregation-node.cc:678

impala::SlotDescriptor::is_nullable
bool is_nullable() const
Definition: descriptors.h:93

impala::Status
Definition: status.h:81

impala::AggregationNode::ProcessRowBatchWithGrouping
void ProcessRowBatchWithGrouping(RowBatch *batch)
Definition: aggregation-node-ir.cc:34

impala::ExecNode::DebugString
std::string DebugString() const
Returns a string representation in DFS order of the plan rooted at this.
Definition: exec-node.cc:345

impala::ExecNode::expr_mem_tracker
MemTracker * expr_mem_tracker()
Definition: exec-node.h:163

impala::TupleRow::LLVM_CLASS_NAME
static const char * LLVM_CLASS_NAME
Definition: tuple-row.h:76

VLOG_QUERY
#define VLOG_QUERY
Definition: logging.h:57

impala::TYPE_INT
Definition: types.h:33

impala::ExprContext::LLVM_CLASS_NAME
static const char * LLVM_CLASS_NAME
Definition: expr-context.h:126

impala::ColumnType::type
PrimitiveType type
Definition: types.h:60

impala::LlvmCodeGen::CastPtrToLlvmPtr
llvm::Value * CastPtrToLlvmPtr(llvm::Type *type, const void *ptr)
Definition: llvm-codegen.cc:366

impala::LlvmCodeGen::FnPrototype::AddArgument
void AddArgument(const NamedVariable &var)
Add argument.
Definition: llvm-codegen.h:171

impala::AggregationNode::probe_expr_ctxs_
std::vector< ExprContext * > probe_expr_ctxs_
Exprs used to evaluate input rows.
Definition: aggregation-node.h:77

impala::MemPool
Definition: mem-pool.h:77

impala::Tuple::LLVM_CLASS_NAME
static const char * LLVM_CLASS_NAME
For C++/IR interop, we need to be able to look up types by name.
Definition: tuple.h:134

impala::RuntimeState
Definition: runtime-state.h:69

impala::AggFnEvaluator::Serialize
void Serialize(FunctionContext *agg_fn_ctx, Tuple *dst)
Definition: agg-fn-evaluator.h:248

impala::SlotDescriptor::type
const ColumnType & type() const
Definition: descriptors.h:78

impala::TYPE_SMALLINT
Definition: types.h:32

impala::RuntimeState::obj_pool
ObjectPool * obj_pool() const
Definition: runtime-state.h:92

impala::OldHashTable
The hash table does not support removes. The hash table is not thread safe.
Definition: old-hash-table.h:84

impala::FunctionContextImpl::LLVM_FUNCTIONCONTEXT_NAME
static const char * LLVM_FUNCTIONCONTEXT_NAME
Definition: udf-internal.h:93

impala::AggFnEvaluator::COUNT
Definition: agg-fn-evaluator.h:67

debug-util.h

RETURN_IF_CANCELLED
#define RETURN_IF_CANCELLED(state)
Definition: runtime-state.h:384

pool
ObjectPool pool
Definition: expr-benchmark.cc:89

aggregation-node.h

impala::AggFnEvaluator::Init
void Init(FunctionContext *agg_fn_ctx, Tuple *dst)
Functions for different phases of the aggregation.
Definition: agg-fn-evaluator.cc:314

string-value.inline.h

impala::ExecNode::Prepare
virtual Status Prepare(RuntimeState *state)
Definition: exec-node.cc:130

ADD_COUNTER
#define ADD_COUNTER(profile, name, unit)
Definition: runtime-profile.h:47

impala::OldHashTable::Iterator::GetTuple
Tuple * GetTuple()
Definition: old-hash-table.h:271

impala::AggregationNode::UpdateTuple
void UpdateTuple(Tuple *tuple, TupleRow *row)
Definition: aggregation-node.cc:369

impala::LlvmCodeGen::GetFunction
llvm::Function * GetFunction(IRFunction::Type)
Definition: llvm-codegen.cc:421

impala::AggregationNode::ProcessRowBatchNoGrouping
void ProcessRowBatchNoGrouping(RowBatch *batch)
Do the aggregation for all tuple rows in the batch.
Definition: aggregation-node-ir.cc:28

impala::AggregationNode::codegen_process_row_batch_fn_
llvm::Function * codegen_process_row_batch_fn_
IR for process row batch. NULL if codegen is disabled.
Definition: aggregation-node.h:98

impala::LlvmCodeGen::AddFunctionToJit
void AddFunctionToJit(llvm::Function *fn, void **fn_ptr)
Definition: llvm-codegen.cc:714

impala::SlotDescriptor::CodegenUpdateNull
llvm::Function * CodegenUpdateNull(LlvmCodeGen *, llvm::StructType *tuple, bool set_null)
Definition: descriptors.cc:510

impala::RawValue::Write
static void Write(const void *value, Tuple *tuple, const SlotDescriptor *slot_desc, MemPool *pool)
Definition: raw-value.cc:303

impala::ExecNode::QueryMaintenance
virtual Status QueryMaintenance(RuntimeState *state)
Definition: exec-node.cc:401

impala::Expr
This is the superclass of all expr evaluation nodes.
Definition: expr.h:116

impala::TYPE_BOOLEAN
Definition: types.h:30

VLOG_ROW
#define VLOG_ROW
Definition: logging.h:59

impala::RuntimeState::desc_tbl
const DescriptorTbl & desc_tbl() const
Definition: runtime-state.h:93

impala::TYPE_BIGINT
Definition: types.h:34

impala::ExecNode::is_closed
bool is_closed()
Definition: exec-node.h:242

impala::RowBatch::CommitLastRow
void CommitLastRow()
Definition: row-batch.h:109

impala::ExecNode::children_
std::vector< ExecNode * > children_
Definition: exec-node.h:214

runtime-state.h

impala::RowBatch
Definition: row-batch.h:66

COUNTER_SET
#define COUNTER_SET(c, v)
Definition: runtime-profile.h:56

count
uint64_t count
Definition: partitioning-throughput-test.cc:35

impala::RuntimeState::batch_size
int batch_size() const
Definition: runtime-state.h:98

impala::AggregationNode::Open
virtual Status Open(RuntimeState *state)
Definition: aggregation-node.cc:174

impala::RowBatch::tuple_data_pool
MemPool * tuple_data_pool()
Definition: row-batch.h:148

impala::ExecNode::rows_returned_counter_
RuntimeProfile::Counter * rows_returned_counter_
Definition: exec-node.h:226

impala::AggregationNode::aggregate_evaluators_
std::vector< AggFnEvaluator * > aggregate_evaluators_
Definition: aggregation-node.h:70

impala::OldHashTable::Iterator::Next
void IR_ALWAYS_INLINE Next()

impala::ExecNode::child
ExecNode * child(int i)
Definition: exec-node.h:241

impala::GetHllUpdateFunction2
IRFunction::Type GetHllUpdateFunction2(const ColumnType &type)
Definition: aggregation-node.cc:413

impala::TupleRow::SetTuple
void SetTuple(int tuple_idx, Tuple *tuple)
Definition: tuple-row.h:34

impala::Expr::type
const ColumnType & type() const
Definition: expr.h:145

impala::CodegenAnyVal::value
llvm::Value * value()
Returns the current type-lowered value.
Definition: codegen-anyval.h:135

impala::TYPE_NULL
Definition: types.h:29

impala::AggregationNode::needs_finalize_
bool needs_finalize_
Definition: aggregation-node.h:108

impala::RowBatch::AddRow
int AddRow()
Definition: row-batch.h:100

impala::RuntimeState::codegen_enabled
bool codegen_enabled() const
Returns true if codegen is enabled for this query.
Definition: runtime-state.h:183

impala::SlotRef
Reference to a single slot of a tuple.
Definition: slot-ref.h:23

impala::ColumnType
Definition: types.h:59

impala::CodegenAnyVal::GetVal
llvm::Value * GetVal(const char *name="val")
Definition: codegen-anyval.cc:258

impala::Status::OK
static const Status OK
Definition: status.h:87

impala::ExecNode::pool_
ObjectPool * pool_
Definition: exec-node.h:211

impala::Expr::GetCodegendComputeFn
virtual Status GetCodegendComputeFn(RuntimeState *state, llvm::Function **fn)=0

tuple.h

impala::LlvmCodeGen::GetType
llvm::Type * GetType(const ColumnType &type)
Returns llvm type for the column type.
Definition: llvm-codegen.cc:312

impala::AggregationNode::agg_fn_ctxs_
std::vector< impala_udf::FunctionContext * > agg_fn_ctxs_
FunctionContext for each agg fn and backing pool.
Definition: aggregation-node.h:73

expr.h

impala::RuntimeState::GetCodegen
Status GetCodegen(LlvmCodeGen **codegen, bool initialize=true)
Definition: runtime-state.cc:312

impala::SlotDescriptor::tuple_offset
int tuple_offset() const
Definition: descriptors.h:88

impala::AggregationNode::FinalizeTuple
Tuple * FinalizeTuple(Tuple *tuple, MemPool *pool)
Definition: aggregation-node.cc:374

mem-pool.h

impala::SlotDescriptor::field_idx
int field_idx() const
Returns the field index in the generated llvm struct for this slot's tuple.
Definition: descriptors.h:87

impala::CodegenAnyVal::GetIsNull
llvm::Value * GetIsNull(const char *name="is_null")
Gets the 'is_null' field of the *Val.
Definition: codegen-anyval.cc:171

impala::AggregationNode::output_tuple_id_
TupleId output_tuple_id_
Definition: aggregation-node.h:88

names.h

impala::LlvmCodeGen::GetIntConstant
llvm::Value * GetIntConstant(PrimitiveType type, int64_t val)
Returns the constant 'val' of 'type'.
Definition: llvm-codegen.cc:371

impala::ExecNode
Definition: exec-node.h:46

impala::ObjectPool::Add
T * Add(T *t)
Definition: object-pool.h:42

impala::Expr::CreateExprTrees
static Status CreateExprTrees(ObjectPool *pool, const std::vector< TExpr > &texprs, std::vector< ExprContext * > *ctxs)
Definition: expr.cc:149

impala::LlvmCodeGen::FinalizeFunction
llvm::Function * FinalizeFunction(llvm::Function *function)
Definition: llvm-codegen.cc:596

impala::ExecNode::EvalConjuncts
static bool EvalConjuncts(ExprContext *const *ctxs, int num_ctxs, TupleRow *row)
Definition: exec-node.cc:393

tuple-row.h

impala::SlotDescriptor::is_materialized
bool is_materialized() const
Definition: descriptors.h:92

impala::TYPE_STRING
Definition: types.h:38

impala::AggFnEvaluator::MIN
Definition: agg-fn-evaluator.h:68

impala::Expr::Prepare
static Status Prepare(const std::vector< ExprContext * > &ctxs, RuntimeState *state, const RowDescriptor &row_desc, MemTracker *tracker)

VLOG_FILE
#define VLOG_FILE
Definition: logging.h:58

impala::AggregationNode::output_iterator_
OldHashTable::Iterator output_iterator_
Definition: aggregation-node.h:68

VLOG_ROW_IS_ON
#define VLOG_ROW_IS_ON
Definition: logging.h:66

impala::AggregationNode::agg_fn_pool_
boost::scoped_ptr< MemPool > agg_fn_pool_
Definition: aggregation-node.h:74

impala::ExecNode::Open
virtual Status Open(RuntimeState *state)
Definition: exec-node.cc:154

impala::LlvmCodeGen::ReplaceCallSites
llvm::Function * ReplaceCallSites(llvm::Function *caller, bool update_in_place, llvm::Function *new_fn, const std::string &target_name, int *num_replaced)
Definition: llvm-codegen.cc:489

impala::AggregationNode::get_results_timer_
RuntimeProfile::Counter * get_results_timer_
Time spent returning the aggregated rows.
Definition: aggregation-node.h:113

impala::PrintRow
string PrintRow(TupleRow *row, const RowDescriptor &d)
Definition: debug-util.cc:192

impala::AggregationNode::hash_table_load_factor_counter_
RuntimeProfile::Counter * hash_table_load_factor_counter_
Load factor in hash table.
Definition: aggregation-node.h:117

impala::Status::ok
bool ok() const
Definition: status.h:172

impala::AggregationNode::process_row_batch_fn_
ProcessRowBatchFn process_row_batch_fn_
Jitted ProcessRowBatch function pointer. Null if codegen is disabled.
Definition: aggregation-node.h:102

impala::AggregationNode::intermediate_tuple_desc_
TupleDescriptor * intermediate_tuple_desc_
Definition: aggregation-node.h:84

impala::LlvmCodeGen::void_type
llvm::Type * void_type()
Definition: llvm-codegen.h:394

impala::AggregationNode::hash_table_buckets_counter_
RuntimeProfile::Counter * hash_table_buckets_counter_
Num buckets in hash table.
Definition: aggregation-node.h:115

impala::AggregationNode::tuple_pool_
boost::scoped_ptr< MemPool > tuple_pool_
Definition: aggregation-node.h:95

impala::ExecNode::conjunct_ctxs_
std::vector< ExprContext * > conjunct_ctxs_
Definition: exec-node.h:212

impala::TYPE_TINYINT
Definition: types.h:31

impala::ExecNode::Close
virtual void Close(RuntimeState *state)
Definition: exec-node.cc:166

impala::LlvmCodeGen::context
llvm::LLVMContext & context()
Definition: llvm-codegen.h:214

descriptors.h

impala::Expr::DebugString
virtual std::string DebugString() const
Definition: expr.cc:385

udf-internal.h

impala::LlvmCodeGen::OptimizeFunctionWithExprs
llvm::Function * OptimizeFunctionWithExprs(llvm::Function *fn)
Definition: llvm-codegen.cc:583

impala::TYPE_FLOAT
Definition: types.h:35

impala::AggregationNode::CodegenProcessRowBatch
llvm::Function * CodegenProcessRowBatch(RuntimeState *state, llvm::Function *update_tuple_fn)
Definition: aggregation-node.cc:782

impala::AggregationNode::Close
virtual void Close(RuntimeState *state)
Definition: aggregation-node.cc:278

impala::LlvmCodeGen::FnPrototype
Definition: llvm-codegen.h:161

impala::AggregationNode::hash_tbl_
boost::scoped_ptr< OldHashTable > hash_tbl_
Definition: aggregation-node.h:67

impala::TYPE_DECIMAL
Definition: types.h:42

impala::ExecNode::runtime_profile
RuntimeProfile * runtime_profile()
Definition: exec-node.h:161

impala::AggregationNode::Init
virtual Status Init(const TPlanNode &tnode)
Definition: aggregation-node.cc:72

impala::AggFnEvaluator::Finalize
void Finalize(FunctionContext *agg_fn_ctx, Tuple *src, Tuple *dst)
Definition: agg-fn-evaluator.h:252

impala::AggFnEvaluator::input_expr_ctxs
const std::vector< ExprContext * > & input_expr_ctxs() const
Definition: agg-fn-evaluator.h:113