#include <boost/thread/thread.hpp>
#include <gtest/gtest.h>

#include "gen-cpp/ImpalaInternalService.h"
#include "gen-cpp/ImpalaInternalService_types.h"
#include "gen-cpp/Types_types.h"
#include "gen-cpp/Descriptors_types.h"

using namespace impala;
using namespace apache::thrift;

DEFINE_int32(port, 20001, "port on which to run Impala test backend");
virtual void ExecPlanFragment(TExecPlanFragmentResult& return_val,
    const TExecPlanFragmentParams& params) {}

virtual void ReportExecStatus(TReportExecStatusResult& return_val,
    const TReportExecStatusParams& params) {}

virtual void CancelPlanFragment(TCancelPlanFragmentResult& return_val,
    const TCancelPlanFragmentParams& params) {}

virtual void TransmitData(TTransmitDataResult& return_val,
    const TTransmitDataParams& params) {
  if (!params.eos) {
    // Hand the batch to the receiver registered for this
    // (fragment instance, dest node) pair.
    mgr_->AddData(params.dest_fragment_instance_id, params.dest_node_id,
        params.row_batch, params.sender_id).SetTStatus(&return_val);
  } else {
    // End-of-stream: report this sender as closed.
    mgr_->CloseSender(params.dest_fragment_instance_id, params.dest_node_id,
        params.sender_id).SetTStatus(&return_val);
  }
}
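// The DataStreamTest fixture below owns both ends of the exchange: the
// RuntimeState and descriptor table, the DataStreamMgr, and per-stream
// bookkeeping in sender_info_ / receiver_info_.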
  : runtime_state_(TPlanFragmentInstanceCtx(), "", &exec_env_),

  runtime_state_.InitMemTrackers(TUniqueId(), NULL, -1);

  CreateTupleComparator();

  next_instance_id_.lo = 0;
  next_instance_id_.hi = 0;
  broadcast_sink_.dest_node_id = DEST_NODE_ID;
  broadcast_sink_.output_partition.type = TPartitionType::UNPARTITIONED;

  random_sink_.dest_node_id = DEST_NODE_ID;
  random_sink_.output_partition.type = TPartitionType::RANDOM;

  hash_sink_.dest_node_id = DEST_NODE_ID;
  hash_sink_.output_partition.type = TPartitionType::HASH_PARTITIONED;

  // Partitioning expr for the hash sink: a single SLOT_REF over the one
  // BIGINT slot in the row.
  TExprNode expr_node;
  expr_node.node_type = TExprNodeType::SLOT_REF;
  expr_node.type.types.push_back(TTypeNode());
  expr_node.type.types.back().__isset.scalar_type = true;
  expr_node.type.types.back().scalar_type.type = TPrimitiveType::BIGINT;
  expr_node.num_children = 0;
  TSlotRef slot_ref;
  slot_ref.slot_id = 0;
  expr_node.__set_slot_ref(slot_ref);
  TExpr expr;
  expr.nodes.push_back(expr_node);
  hash_sink_.output_partition.__isset.partition_exprs = true;
  hash_sink_.output_partition.partition_exprs.push_back(expr);
  sender_info_.reserve(MAX_SENDERS);
  receiver_info_.reserve(MAX_RECEIVERS);
const TDataStreamSink& GetSink(TPartitionType::type partition_type) {
  switch (partition_type) {
    case TPartitionType::UNPARTITIONED: return broadcast_sink_;
    case TPartitionType::RANDOM: return random_sink_;
    case TPartitionType::HASH_PARTITIONED: return hash_sink_;
    default: DCHECK(false) << "Unhandled sink type: " << partition_type;
  }
  // Not reached; keeps the compiler happy.
  return broadcast_sink_;
}
  lhs_slot_ctx_->Close(NULL);
  rhs_slot_ctx_->Close(NULL);

  sender_info_.clear();
  receiver_info_.clear();
static const int MAX_SENDERS = 16;
static const int MAX_RECEIVERS = 16;
static const int BATCH_CAPACITY = 100;
static const int PER_ROW_DATA = 8;
static const int TOTAL_DATA_SIZE = 8 * 1024;
static const int NUM_BATCHES = TOTAL_DATA_SIZE / BATCH_CAPACITY / PER_ROW_DATA;
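// Sanity arithmetic: each batch carries BATCH_CAPACITY * PER_ROW_DATA =
// 100 * 8 = 800 bytes of tuple data, and NUM_BATCHES = 8192 / 100 / 8 = 10
// under integer division, so every sender ships roughly TOTAL_DATA_SIZE bytes.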
vector<TPlanFragmentDestination> dest_;
ReceiverInfo(TPartitionType::type stream_type, int num_senders, int receiver_num)
  : stream_type(stream_type),
    num_senders(num_senders),
    receiver_num(receiver_num),
    num_rows_received(0) {}

~ReceiverInfo() {
  delete thread_handle;
  stream_recvr.reset();
}
  dest_.push_back(TPlanFragmentDestination());
  TPlanFragmentDestination& dest = dest_.back();
  dest.fragment_instance_id = next_instance_id_;
  dest.server.hostname = "127.0.0.1";
  dest.server.port = FLAGS_port;
  *instance_id = next_instance_id_;
  ++next_instance_id_.lo;
  TTupleDescriptor tuple_desc;
  tuple_desc.__set_id(0);
  tuple_desc.__set_byteSize(8);
  tuple_desc.__set_numNullBytes(0);
  TDescriptorTable thrift_desc_tbl;
  thrift_desc_tbl.tupleDescriptors.push_back(tuple_desc);
  TSlotDescriptor slot_desc;
  slot_desc.__set_id(0);
  slot_desc.__set_parent(0);
  slot_desc.__set_slotType(type.ToThrift());
  slot_desc.__set_columnPath(vector<int>(1, 0));
  slot_desc.__set_byteOffset(0);
  slot_desc.__set_nullIndicatorByte(0);
  slot_desc.__set_nullIndicatorBit(-1);
  slot_desc.__set_slotIdx(0);
  slot_desc.__set_isMaterialized(true);
  thrift_desc_tbl.slotDescriptors.push_back(slot_desc);
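// The whole test schema is a single 8-byte tuple holding one materialized
// BIGINT slot at byte offset 0; nullIndicatorBit == -1 marks the slot
// non-nullable, consistent with numNullBytes == 0 on the tuple.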
  vector<TTupleId> row_tids;
  row_tids.push_back(0);
  vector<bool> nullable_tuples;
  nullable_tuples.push_back(false);
  lhs_slot_ctx_->Prepare(NULL, *row_desc_, &tracker_);
  rhs_slot_ctx_->Prepare(NULL, *row_desc_, &tracker_);
  lhs_slot_ctx_->Open(NULL);
  rhs_slot_ctx_->Open(NULL);
  less_than_ = obj_pool_->Add(new TupleRowComparator(
      vector<ExprContext*>(1, lhs_slot_ctx_), vector<ExprContext*>(1, rhs_slot_ctx_),
      vector<bool>(1, true), vector<bool>(1, false)));
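// Assuming TupleRowComparator's argument order is (lhs key exprs, rhs key
// exprs, is_asc, nulls_first), this comparator orders rows by the single
// BIGINT slot, ascending.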
  int64_t* tuple_mem = reinterpret_cast<int64_t*>(
      batch->tuple_data_pool()->Allocate(BATCH_CAPACITY * 8));
  bzero(tuple_mem, BATCH_CAPACITY * 8);
  for (int i = 0; i < BATCH_CAPACITY; ++i) {
    TupleRow* row = batch->GetRow(batch->AddRow());
    row->SetTuple(0, reinterpret_cast<Tuple*>(&tuple_mem[i]));
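// Each row's only tuple points directly at one int64 in tuple_mem, so
// writing tuple_mem[i] sets row i's single BIGINT slot.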
  for (int i = 0; i < BATCH_CAPACITY; ++i) {
    TupleRow* row = batch->GetRow(i);
    int64_t* val = reinterpret_cast<int64_t*>(row->GetTuple(0)->GetSlot(0));
    *val = (*next_val)++;
void StartReceiver(TPartitionType::type stream_type, int num_senders, int receiver_num,
    int buffer_size, bool is_merging, TUniqueId* out_id = NULL) {

  TUniqueId instance_id;
  GetNextInstanceId(&instance_id);
  receiver_info_.push_back(ReceiverInfo(stream_type, num_senders, receiver_num));

  receiver_info_.back().stream_recvr =
      stream_mgr_->CreateRecvr(&runtime_state_,
          *row_desc_, instance_id, DEST_NODE_ID, num_senders, buffer_size, profile,
          is_merging);

  if (out_id != NULL) *out_id = instance_id;
  for (int i = 0; i < receiver_info_.size(); ++i) {
    receiver_info_[i].thread_handle->join();
    receiver_info_[i].stream_recvr->Close();
  }
  for (int i = 0; i < batch->num_rows(); ++i) {

  for (int i = 0; i < batch.num_rows(); ++i) {
  multiset<int64_t> all_data_values;
  for (int i = 0; i < receiver_info_.size(); ++i) {

    if (stream_type == TPartitionType::UNPARTITIONED) {
      EXPECT_EQ(
          NUM_BATCHES * BATCH_CAPACITY * num_senders, info.data_values.size());
    }

    for (multiset<int64_t>::iterator j = info.data_values.begin();
         j != info.data_values.end(); ++j, ++k) {
      if (stream_type == TPartitionType::UNPARTITIONED) {
        // Each sender contributes the same sequence, so the sorted stream is
        // 0, 0, ..., 1, 1, ... and the k-th element equals k / num_senders.
        EXPECT_EQ(k / num_senders, *j);
      } else if (stream_type == TPartitionType::HASH_PARTITIONED) {
        // The value must have hashed to this receiver.
        EXPECT_EQ(hash_val % receiver_info_.size(), info.receiver_num);

  if (stream_type == TPartitionType::HASH_PARTITIONED) {
    EXPECT_EQ(NUM_BATCHES * BATCH_CAPACITY * num_senders, total);

    for (multiset<int64_t>::iterator j = all_data_values.begin();
         j != all_data_values.end(); ++j, ++k) {
      // The union of all receivers' values contains each value once per sender.
      EXPECT_EQ(k / num_senders, *j);
      if (k / num_senders != *j) break;
  for (int i = 0; i < sender_info_.size(); ++i) {
    EXPECT_TRUE(sender_info_[i].status.ok());
    EXPECT_GT(sender_info_[i].num_bytes_sent, 0);
  }
  shared_ptr<TProcessor> processor(new ImpalaInternalServiceProcessor(handler));
  server_ = new ThriftServer("DataStreamTest backend", processor, FLAGS_port, NULL);

  server_->StopForTesting();
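// Senders reach this backend over a real localhost Thrift connection
// (127.0.0.1:FLAGS_port), so the test exercises the full RPC and
// serialization path instead of calling DataStreamMgr directly.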
void StartSender(TPartitionType::type partition_type = TPartitionType::UNPARTITIONED,
    int channel_buffer_size = 1024) {

  int num_senders = sender_info_.size();
  DCHECK_LT(num_senders, MAX_SENDERS);

  for (int i = 0; i < sender_info_.size(); ++i) {
    sender_info_[i].thread_handle->join();
void Sender(int sender_num, int channel_buffer_size,
    TPartitionType::type partition_type) {

  const TDataStreamSink& sink = GetSink(partition_type);

  EXPECT_TRUE(sender.Prepare(&state).ok());
  EXPECT_TRUE(sender.Open(&state).ok());
  scoped_ptr<RowBatch> batch(CreateRowBatch());

  for (int i = 0; i < NUM_BATCHES; ++i) {
    GetNextBatch(batch.get(), &next_val);
    VLOG_QUERY << "sender " << sender_num << ": #rows=" << batch->num_rows();
    info.status = sender.Send(&state, batch.get(), false);

  sender.Close(&state);
void TestStream(TPartitionType::type stream_type, int num_senders,
    int num_receivers, int buffer_size, bool is_merging) {
  VLOG_QUERY << "Testing stream=" << stream_type << " #senders=" << num_senders
             << " #receivers=" << num_receivers << " buffer_size=" << buffer_size
             << " is_merging=" << is_merging;

  for (int i = 0; i < num_receivers; ++i) {
    StartReceiver(stream_type, num_senders, i, buffer_size, is_merging);
  }
  for (int i = 0; i < num_senders; ++i) {
    StartSender(stream_type, buffer_size);
  }

  CheckReceivers(stream_type, num_senders);
  GetNextInstanceId(&dummy_id);
  StartSender(TPartitionType::UNPARTITIONED, TOTAL_DATA_SIZE + 1024);

  EXPECT_TRUE(sender_info_[0].status.ok());
  EXPECT_GT(sender_info_[0].num_bytes_sent, 0);

  GetNextInstanceId(&dummy_id);

  EXPECT_TRUE(sender_info_[0].status.ok());
  EXPECT_GT(sender_info_[0].num_bytes_sent, 0);
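// Both "unknown sender" cases expect the send to succeed even though no
// receiver is ever created for dummy_id: a sender whose destination never
// materializes must neither hang nor report an error.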
  TUniqueId instance_id;
  StartReceiver(TPartitionType::UNPARTITIONED, 1, 1, 1024, false, &instance_id);
  stream_mgr_->Cancel(instance_id);
  StartReceiver(TPartitionType::UNPARTITIONED, 1, 1, 1024, true, &instance_id);
  stream_mgr_->Cancel(instance_id);

  EXPECT_TRUE(receiver_info_[0].status.IsCancelled());
  EXPECT_TRUE(receiver_info_[1].status.IsCancelled());
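// Cancelling via DataStreamMgr::Cancel() must unblock both the non-merging
// and the merging receiver and surface CANCELLED as their final status.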
  TPartitionType::type stream_types[] =
      {TPartitionType::UNPARTITIONED, TPartitionType::RANDOM,
       TPartitionType::HASH_PARTITIONED};
  int sender_nums[] = {1, 4};
  int receiver_nums[] = {1, 4};
  int buffer_sizes[] = {1024, 1024 * 1024};
  bool merging[] = {false, true};
  for (int i = 0; i < sizeof(stream_types) / sizeof(*stream_types); ++i) {
    for (int j = 0; j < sizeof(sender_nums) / sizeof(int); ++j) {
      for (int k = 0; k < sizeof(receiver_nums) / sizeof(int); ++k) {
        for (int l = 0; l < sizeof(buffer_sizes) / sizeof(int); ++l) {
          for (int m = 0; m < sizeof(merging) / sizeof(bool); ++m) {
            TestStream(stream_types[i], sender_nums[j], receiver_nums[k],
                buffer_sizes[l], merging[m]);
          }
        }
      }
    }
  }
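// 3 partition types x 2 sender counts x 2 receiver counts x 2 buffer sizes
// x 2 merging modes = 48 TestStream() configurations in one test.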
int main(int argc, char** argv) {
  ::testing::InitGoogleTest(&argc, argv);

  return RUN_ALL_TESTS();
}