doc/html/atod-benchmark_8cc_source.html

 // Copyright 2015 Cloudera Inc.

 //

 // Licensed under the Apache License, Version 2.0 (the "License");

 // you may not use this file except in compliance with the License.

 // You may obtain a copy of the License at

 //

 // http://www.apache.org/licenses/LICENSE-2.0

 //

 // Unless required by applicable law or agreed to in writing, software

 // distributed under the License is distributed on an "AS IS" BASIS,

 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 // See the License for the specific language governing permissions and

 // limitations under the License.


 #include <stdlib.h>

 #include <stdio.h>

 #include <iostream>

 #include <vector>

 #include <sstream>

 #include "runtime/string-value.h"

 #include "util/benchmark.h"

 #include "util/cpu-info.h"

 #include "util/string-parser.h"


 #include "common/names.h"


 using namespace impala;


 // Machine Info: Intel(R) Core(TM) i7-4790K CPU @ 4.00GHz

 // atod:                 Function     Rate (iters/ms)          Comparison

 //----------------------------------------------------------------------

 //               Impala Decimal4                84.6                  1X

 //               Impala Decimal8               49.77             0.5883X

 //              Impala Decimal16               17.08             0.2019X


 // Input and output state for one decimal-parsing benchmark. 'Decimal' is the
 // value type the parsed results are stored as (see 'result').
 template <typename Decimal>

 struct TestData {

   // Decimal precision; used to bound the generated values and to build the
   // ColumnType the parser is invoked with.
   int precision;

   // Decimal scale; used to bound the generated fractional part and to build the
   // ColumnType the parser is invoked with.
   int scale;

   // A generated value gets a leading "-" when this exceeds a Rand() draw.
   double probability_negative;

   // Views (pointer + length) over the strings held in 'memory'. These are the
   // inputs handed to the parser.
   vector<StringValue> data;

   // Owns the characters that the entries of 'data' point into.
   vector<string> memory;

   // result[j] receives the value parsed from data[j]. Callers must size this to
   // at least data.size() before running the benchmark.
   vector<Decimal> result;

 };


 // Draws the next value from rand() and scales it by RAND_MAX, giving a double
 // in the closed interval [0, 1].
 double Rand() {
   const double draw = rand();
   return draw / RAND_MAX;
 }


 // Appends 'input' as one more test value: a copy of the string is stored in
 // data->memory and a StringValue viewing that copy is appended to data->data.
 //
 // data->data[i] is expected to view data->memory[i]; this function is the only
 // place in this file that appends to either vector, which keeps them in step.
 template <typename Decimal>
 void AddTestData(TestData<Decimal>* data, const string& input) {
   const size_t old_capacity = data->memory.capacity();
   data->memory.push_back(input);
   if (data->memory.capacity() != old_capacity) {
     // The vector reallocated, so every previously stored string is now a new
     // object and may own a different character buffer (always the case for
     // short strings kept inline in the string object). Re-point the existing
     // views so they do not dangle. Lengths are unchanged.
     for (size_t i = 0; i < data->data.size(); ++i) {
       data->data[i].ptr = const_cast<char*>(data->memory[i].c_str());
     }
   }
   const string& str = data->memory.back();
   data->data.push_back(StringValue(const_cast<char*>(str.c_str()), str.length()));
 }


 // Generates 'n' random decimal strings that fit data->precision / data->scale
 // and appends each one through the string overload of AddTestData().
 //
 // Each string is built from, in order: an optional "-" (emitted when
 // data->probability_negative exceeds a Rand() draw), a random whole part (only
 // when the type has whole digits) and "." followed by a random fractional part
 // (only when the scale is non-zero).
 template <typename Decimal>
 void AddTestData(TestData<Decimal>* data, int n) {
   // Largest whole part that fits in (precision - scale) digits, or 0 if none.
   int128_t whole_limit = 0;
   if (data->precision > data->scale) {
     whole_limit =
         DecimalUtil::GetScaleMultiplier<int128_t>(data->precision - data->scale) - 1;
   }

   // Largest fractional part that fits in 'scale' digits, or 0 if none.
   int128_t fraction_limit = 0;
   if (data->scale > 0) {
     fraction_limit = DecimalUtil::GetScaleMultiplier<int128_t>(data->scale) - 1;
   }

   for (int remaining = n; remaining > 0; --remaining) {
     stringstream text;
     const bool negative = data->probability_negative > Rand();
     if (negative) text << "-";
     if (whole_limit > 0) {
       const int128_t whole_part = static_cast<int128_t>(whole_limit * Rand());
       text << whole_part;
     }
     if (fraction_limit > 0) {
       const int128_t fraction_part = static_cast<int128_t>(fraction_limit * Rand());
       text << "." << fraction_part;
     }
     AddTestData(data, text.str());
   }
 }


 template <typename Decimal, typename Storage>

 void TestImpala(int batch_size, void* d) {

   TestData<Decimal>* data = reinterpret_cast<TestData<Decimal>*>(d);

   ColumnType column_type = ColumnType::CreateDecimalType(data->precision, data->scale);

   Decimal val;

   for (int i = 0; i < batch_size; ++i) {

     int n = data->data.size();

     for (int j = 0; j < n; ++j) {

       const StringValue& str = data->data[j];

       StringParser::ParseResult dummy;

       val = StringParser::StringToDecimal<Storage>(

           str.ptr, str.len, column_type, &dummy);

       data->result[j] = val;

     }

   }

 }


 int main(int argc, char **argv) {

   CpuInfo::Init();

   cout << Benchmark::GetMachineInfo() << endl;


   Benchmark suite("atod");


   TestData<Decimal4Value> data4;

   data4.precision = ColumnType::MAX_DECIMAL4_PRECISION;

   data4.scale = data4.precision / 2;

   data4.probability_negative = 0.25;

   AddTestData(&data4, 1000);

   data4.result.resize(data4.data.size());

   suite.AddBenchmark("Impala Decimal4", TestImpala<Decimal4Value, int32_t>, &data4);


   TestData<Decimal8Value> data8;

   data8.precision = ColumnType::MAX_DECIMAL8_PRECISION;

   data8.scale = data8.precision / 2;

   data8.probability_negative = 0.25;

   AddTestData(&data8, 1000);

   data8.result.resize(data8.data.size());

   suite.AddBenchmark("Impala Decimal8", TestImpala<Decimal8Value, int64_t>, &data8);


   TestData<Decimal16Value> data16;

   data16.precision = ColumnType::MAX_PRECISION;

   data16.scale = data16.precision / 2;

   data16.probability_negative = 0.25;

   AddTestData(&data16, 1000);

   data16.result.resize(data16.data.size());

   suite.AddBenchmark("Impala Decimal16", TestImpala<Decimal16Value, int128_t>, &data16);


   cout << suite.Measure();

   return 0;

 }

TestData::memory
vector< string > memory
Definition: atod-benchmark.cc:42

TestData::probability_negative
double probability_negative
Definition: atod-benchmark.cc:40

impala::Benchmark::AddBenchmark
int AddBenchmark(const std::string &name, BenchmarkFunction fn, void *args, int baseline_idx=0)
Definition: benchmark.cc:70

impala::Benchmark
Definition: benchmark.h:31

impala::StringValue
Definition: string-value.h:33

impala::ColumnType::MAX_DECIMAL8_PRECISION
static const int MAX_DECIMAL8_PRECISION
The maximum precision representable by an 8-byte decimal (Decimal8Value)
Definition: types.h:77

AddTestData
void AddTestData(TestData< Decimal > *data, const string &input)
Definition: atod-benchmark.cc:51

impala::Benchmark::GetMachineInfo
static std::string GetMachineInfo()
Output machine/build configuration as a string.
Definition: benchmark.cc:124

impala::StringValue::len
int len
Definition: string-value.h:38

impala::Benchmark::Measure
std::string Measure()
Runs all the benchmarks and returns the result in a formatted string.
Definition: benchmark.cc:83

TestImpala
void TestImpala(int batch_size, void *d)
Definition: atod-benchmark.cc:73

TestData::precision
int precision
Definition: atod-benchmark.cc:38

string-parser.h

TestData
Definition: atod-benchmark.cc:37

impala::ColumnType::MAX_DECIMAL4_PRECISION
static const int MAX_DECIMAL4_PRECISION
The maximum precision representable by a 4-byte decimal (Decimal4Value)
Definition: types.h:75

impala::StringValue::ptr
char * ptr
Definition: string-value.h:37

impala::StringParser::ParseResult
ParseResult
Definition: string-parser.h:51

main
int main(int argc, char **argv)
Definition: atod-benchmark.cc:89

Rand
double Rand()
Definition: atod-benchmark.cc:46

TestData::data
vector< StringValue > data
Definition: atod-benchmark.cc:41

impala::ColumnType
Definition: types.h:59

TestData::scale
int scale
Definition: atod-benchmark.cc:39

TestData::result
vector< Decimal > result
Definition: atod-benchmark.cc:43

names.h

impala::CpuInfo::Init
static void Init()
Initialize CpuInfo.
Definition: cpu-info.cc:75

benchmark.h

impala::ColumnType::CreateDecimalType
static ColumnType CreateDecimalType(int precision, int scale)
Definition: types.h:103

string-value.h

impala::ColumnType::MAX_PRECISION
static const int MAX_PRECISION
Must be kept in sync with FE's max precision/scale.
Definition: types.h:71

cpu-info.h

impala::int128_t
__int128_t int128_t
We use the C++ int128_t type. It is stored using 16 bytes and is very performant.
Definition: multi-precision.h:51