doc/html/decimal-util_8h_source.html

 // Copyright 2012 Cloudera Inc.

 //

 // Licensed under the Apache License, Version 2.0 (the "License");

 // you may not use this file except in compliance with the License.

 // You may obtain a copy of the License at

 //

 // http://www.apache.org/licenses/LICENSE-2.0

 //

 // Unless required by applicable law or agreed to in writing, software

 // distributed under the License is distributed on an "AS IS" BASIS,

 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 // See the License for the specific language governing permissions and

 // limitations under the License.


 #ifndef IMPALA_UTIL_DECIMAL_UTIL_H

 #define IMPALA_UTIL_DECIMAL_UTIL_H


 #include <ostream>

 #include <string>

 #include <boost/cstdint.hpp>


 #include "runtime/types.h"

 #include "runtime/multi-precision.h"

 #include "util/bit-util.h"


 namespace impala {


 // Static helpers for scaling decimal values by powers of ten and for converting
 // them to and from fixed-length, big-endian byte arrays.
 class DecimalUtil {
  public:
   // Maximum absolute value of int128_t that we use. This is 38 digits of 9's.
   static int128_t MAX_UNSCALED_DECIMAL;

   // Initializes MAX_UNSCALED_DECIMAL. Must be called once before using it.
   static void InitMaxUnscaledDecimal();

   // Returns 'v' multiplied by 10^t.scale. 't' must be a decimal type (DCHECKed).
   // TODO: do we need to handle overflow here or at a higher abstraction.
   template<typename T>
   static T MultiplyByScale(const T& v, const ColumnType& t) {
     DCHECK(t.type == TYPE_DECIMAL);
     return MultiplyByScale(v, t.scale);
   }

   // Returns 'v' multiplied by 10^scale. No overflow detection is done here.
   template<typename T>
   static T MultiplyByScale(const T& v, int scale) {
     return v * GetScaleMultiplier<T>(scale);
   }

   // Returns 10^scale as a T. 'scale' must be >= 0 (DCHECKed).
   // This generic version multiplies by 10 'scale' times and does not detect
   // overflow; the int32_t/int64_t/int128_t specializations in this file use lookup
   // tables and return -1 when the result does not fit.
   template<typename T>
   static T GetScaleMultiplier(int scale) {
     DCHECK_GE(scale, 0);
     T result = 1;
     for (int i = 0; i < scale; ++i) {
       result *= 10;
     }
     return result;
   }

   // Write decimals as big endian (byte comparable) in fixed_len_size bytes.
   // Only the fixed_len_size least significant bytes of 'v' are written to 'buffer';
   // fixed_len_size must be in (0, sizeof(T)]. Debug builds verify that the bytes
   // that are dropped are pure sign extension (all 0 or all -1).
   template<typename T>
   static inline void EncodeToFixedLenByteArray(
       uint8_t* buffer, int fixed_len_size, const T& v) {
     DCHECK_GT(fixed_len_size, 0);
     DCHECK_LE(fixed_len_size, sizeof(T));

 #if __BYTE_ORDER == __LITTLE_ENDIAN
     BitUtil::ByteSwap(buffer, &v, fixed_len_size);
 #else
     // Cast to a byte pointer first: arithmetic on 'const T*' would advance in units
     // of sizeof(T) and read far outside of 'v'.
     memcpy(buffer,
         reinterpret_cast<const uint8_t*>(&v) + sizeof(T) - fixed_len_size,
         fixed_len_size);
 #endif

 #ifndef NDEBUG
 #if __BYTE_ORDER == __LITTLE_ENDIAN
     const int8_t* skipped_bytes_start = reinterpret_cast<const int8_t*>(&v) +
         fixed_len_size;
 #else
     const int8_t* skipped_bytes_start = reinterpret_cast<const int8_t*>(&v);
 #endif
     // On debug, verify that the skipped bytes are what we expect.
     const int num_skipped_bytes = static_cast<int>(sizeof(T)) - fixed_len_size;
     for (int i = 0; i < num_skipped_bytes; ++i) {
       DCHECK_EQ(skipped_bytes_start[i], v.value() < 0 ? -1 : 0);
     }
 #endif
   }

   // Reads fixed_len_size big-endian bytes from 'buffer' and stores the sign-extended
   // result in '*v'. fixed_len_size must be in (0, sizeof(T)].
   template<typename T>
   static inline void DecodeFromFixedLenByteArray(
       const uint8_t* buffer, int fixed_len_size, T* v) {
     DCHECK_GT(fixed_len_size, 0);
     DCHECK_LE(fixed_len_size, sizeof(T));
     *v = 0;
     // We need to sign extend v. For example, if the original value was
     // -1, the original bytes were -1,-1,-1,-1. If we only wrote out 1 byte, after
     // the encode step above, v would contain (-1, 0, 0, 0). We need to sign
     // extend the remaining 3 bytes to get the original value.
     // We do this by filling in the most significant bytes and (arithmetic) bit
     // shifting down.
     int bytes_to_fill = sizeof(T) - fixed_len_size;
 #if __BYTE_ORDER == __LITTLE_ENDIAN
     // The most significant bytes of *v are the last ones in memory.
     BitUtil::ByteSwap(
         reinterpret_cast<int8_t*>(v) + bytes_to_fill, buffer, fixed_len_size);
 #else
     // The most significant bytes of *v are the first ones in memory.
     memcpy(v, buffer, fixed_len_size);
 #endif
     v->value() >>= (bytes_to_fill * 8);
   }
 };


 // int32_t specialization: looks up 10^scale in a table holding every power of ten
 // that fits in 32 bits. Returns -1 if 'scale' falls outside the table, i.e. the
 // multiplier would overflow (a negative 'scale' is additionally DCHECKed).
 template <>
 inline int32_t DecimalUtil::GetScaleMultiplier<int32_t>(int scale) {
   DCHECK_GE(scale, 0);
   static const int32_t values[] = {
       1,
       10,
       100,
       1000,
       10000,
       100000,
       1000000,
       10000000,
       100000000,
       1000000000};
   // Derive the bound from the table itself so the two cannot drift apart.
   const int num_values = sizeof(values) / sizeof(values[0]);
   DCHECK_GE(num_values, ColumnType::MAX_DECIMAL4_PRECISION);
   // DCHECKs are compiled out in release builds, so check the lower bound
   // explicitly rather than index before the start of the table.
   if (LIKELY(scale >= 0 && scale < num_values)) return values[scale];
   return -1;  // Overflow
 }


 // int64_t specialization: looks up 10^scale in a table holding every power of ten
 // that fits in 64 bits. Returns -1 if 'scale' falls outside the table, i.e. the
 // multiplier would overflow (a negative 'scale' is additionally DCHECKed).
 template <>
 inline int64_t DecimalUtil::GetScaleMultiplier<int64_t>(int scale) {
   DCHECK_GE(scale, 0);
   static const int64_t values[] = {
       1ll,
       10ll,
       100ll,
       1000ll,
       10000ll,
       100000ll,
       1000000ll,
       10000000ll,
       100000000ll,
       1000000000ll,
       10000000000ll,
       100000000000ll,
       1000000000000ll,
       10000000000000ll,
       100000000000000ll,
       1000000000000000ll,
       10000000000000000ll,
       100000000000000000ll,
       1000000000000000000ll};
   // Derive the bound from the table itself so the two cannot drift apart.
   const int num_values = sizeof(values) / sizeof(values[0]);
   DCHECK_GE(num_values, ColumnType::MAX_DECIMAL8_PRECISION);
   // DCHECKs are compiled out in release builds, so check the lower bound
   // explicitly rather than index before the start of the table.
   if (LIKELY(scale >= 0 && scale < num_values)) return values[scale];
   return -1;  // Overflow
 }


 // int128_t specialization: looks up 10^scale in a table covering 10^0 through
 // 10^38. Returns -1 if 'scale' falls outside the table, i.e. the multiplier would
 // overflow (a negative 'scale' is additionally DCHECKed).
 template <>
 inline int128_t DecimalUtil::GetScaleMultiplier<int128_t>(int scale) {
   DCHECK_GE(scale, 0);
   // Entries above 10^18 are written as products because they do not fit in a
   // 64-bit integer literal.
   static const int128_t values[] = {
       static_cast<int128_t>(1ll),
       static_cast<int128_t>(10ll),
       static_cast<int128_t>(100ll),
       static_cast<int128_t>(1000ll),
       static_cast<int128_t>(10000ll),
       static_cast<int128_t>(100000ll),
       static_cast<int128_t>(1000000ll),
       static_cast<int128_t>(10000000ll),
       static_cast<int128_t>(100000000ll),
       static_cast<int128_t>(1000000000ll),
       static_cast<int128_t>(10000000000ll),
       static_cast<int128_t>(100000000000ll),
       static_cast<int128_t>(1000000000000ll),
       static_cast<int128_t>(10000000000000ll),
       static_cast<int128_t>(100000000000000ll),
       static_cast<int128_t>(1000000000000000ll),
       static_cast<int128_t>(10000000000000000ll),
       static_cast<int128_t>(100000000000000000ll),
       static_cast<int128_t>(1000000000000000000ll),
       static_cast<int128_t>(1000000000000000000ll) * 10ll,
       static_cast<int128_t>(1000000000000000000ll) * 100ll,
       static_cast<int128_t>(1000000000000000000ll) * 1000ll,
       static_cast<int128_t>(1000000000000000000ll) * 10000ll,
       static_cast<int128_t>(1000000000000000000ll) * 100000ll,
       static_cast<int128_t>(1000000000000000000ll) * 1000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 10000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 100000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 1000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 10000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 100000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 1000000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 10000000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 100000000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 1000000000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 10000000000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 100000000000000000ll,
       static_cast<int128_t>(1000000000000000000ll) * 100000000000000000ll * 10ll,
       static_cast<int128_t>(1000000000000000000ll) * 100000000000000000ll * 100ll,
       static_cast<int128_t>(1000000000000000000ll) * 100000000000000000ll * 1000ll};
   // Derive the bound from the table itself so the two cannot drift apart.
   const int num_values = sizeof(values) / sizeof(values[0]);
   DCHECK_GE(num_values, ColumnType::MAX_PRECISION);
   // DCHECKs are compiled out in release builds, so check the lower bound
   // explicitly rather than index before the start of the table.
   if (LIKELY(scale >= 0 && scale < num_values)) return values[scale];
   return -1;  // Overflow
 }


 }


 #endif

types.h

impala::DecimalUtil::DecodeFromFixedLenByteArray
static void DecodeFromFixedLenByteArray(const uint8_t *buffer, int fixed_len_size, T *v)
Definition: decimal-util.h:87

impala::DecimalUtil::MultiplyByScale
static T MultiplyByScale(const T &v, int scale)
Definition: decimal-util.h:45

impala::ColumnType::MAX_DECIMAL8_PRECISION
static const int MAX_DECIMAL8_PRECISION
The maximum precision representable by an 8-byte decimal (Decimal8Value)
Definition: types.h:77

impala::ColumnType::scale
int scale
Definition: types.h:68

impala::DecimalUtil::EncodeToFixedLenByteArray
static void EncodeToFixedLenByteArray(uint8_t *buffer, int fixed_len_size, const T &v)
Write decimals as big endian (byte comparable) in fixed_len_size bytes.
Definition: decimal-util.h:61

multi-precision.h

impala::BitUtil::ByteSwap
static int64_t ByteSwap(int64_t value)
Swaps the byte order (i.e. endianness)
Definition: bit-util.h:149

impala::DecimalUtil::MAX_UNSCALED_DECIMAL
static int128_t MAX_UNSCALED_DECIMAL
Maximum absolute value of int128_t that we use. This is 38 digits of 9's.
Definition: decimal-util.h:32

impala::DecimalUtil::MultiplyByScale
static T MultiplyByScale(const T &v, const ColumnType &t)
TODO: do we need to handle overflow here or at a higher abstraction.
Definition: decimal-util.h:39

impala::ColumnType::type
PrimitiveType type
Definition: types.h:60

impala::DecimalUtil::GetScaleMultiplier
static T GetScaleMultiplier(int scale)
Definition: decimal-util.h:50

bit-util.h

impala::DecimalUtil
Definition: decimal-util.h:29

impala::DecimalUtil::InitMaxUnscaledDecimal
static void InitMaxUnscaledDecimal()
Initializes MAX_UNSCALED_DECIMAL. Must be called once before using it.
Definition: decimal-util.cc:22

impala::ColumnType::MAX_DECIMAL4_PRECISION
static const int MAX_DECIMAL4_PRECISION
The maximum precision representable by a 4-byte decimal (Decimal4Value)
Definition: types.h:75

impala::ColumnType
Definition: types.h:59

LIKELY
#define LIKELY(expr)
Definition: compiler-util.h:32

impala::ColumnType::MAX_PRECISION
static const int MAX_PRECISION
Must be kept in sync with FE's max precision/scale.
Definition: types.h:71

impala::TYPE_DECIMAL
Definition: types.h:42

impala::int128_t
__int128_t int128_t
We use the C++ int128_t type. This is stored using 16 bytes and is very performant.
Definition: multi-precision.h:51