doc/html/cast-functions_8cc_source.html

 // Copyright 2012 Cloudera Inc.

 //

 // Licensed under the Apache License, Version 2.0 (the "License");

 // you may not use this file except in compliance with the License.

 // You may obtain a copy of the License at

 //

 // http://www.apache.org/licenses/LICENSE-2.0

 //

 // Unless required by applicable law or agreed to in writing, software

 // distributed under the License is distributed on an "AS IS" BASIS,

 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 // See the License for the specific language governing permissions and

 // limitations under the License.


 #include "exprs/cast-functions.h"


 #include <boost/lexical_cast.hpp>


 #include "exprs/anyval-util.h"

 #include "exprs/decimal-functions.h"

 #include "runtime/timestamp-value.h"

 #include "util/string-parser.h"

 #include "string-functions.h"


 #include "common/names.h"


 using namespace impala;

 using namespace impala_udf;


 // The maximum number of characters needed to represent a floating-point number (float

 // or double) as a string, excluding the trailing '\0'.

 // 24 = 17 (maximum significant digits) + 1 (decimal point) + 1 ('E')

 // + 3 (exponent digits) + 2 (negative signs) (see http://stackoverflow.com/a/1701085)

 const int MAX_FLOAT_CHARS = 24;


 // Generates CastFunctions::CastTo<to_type>(ctx, const from_type&).
 // A NULL input produces to_type::null(); otherwise the input's 'val' member is passed
 // to the to_type constructor, so the conversion follows the usual C++ rules for the
 // two underlying value types. 'ctx' is not used by the generated body.
 #define CAST_FUNCTION(from_type, to_type) \
   to_type CastFunctions::CastTo##to_type(FunctionContext* ctx, const from_type& val) { \
     return val.is_null ? to_type::null() : to_type(val.val); \
   }


 // Instantiate CAST_FUNCTION for every ordered pair of distinct types among BooleanVal,
 // TinyIntVal, SmallIntVal, IntVal, BigIntVal, FloatVal and DoubleVal (7 groups of 6).
 // Each group below shares one target type.

 // Target: BooleanVal.
 CAST_FUNCTION(TinyIntVal, BooleanVal)

 CAST_FUNCTION(SmallIntVal, BooleanVal)

 CAST_FUNCTION(IntVal, BooleanVal)

 CAST_FUNCTION(BigIntVal, BooleanVal)

 CAST_FUNCTION(FloatVal, BooleanVal)

 CAST_FUNCTION(DoubleVal, BooleanVal)


 // Target: TinyIntVal.
 CAST_FUNCTION(BooleanVal, TinyIntVal)

 CAST_FUNCTION(SmallIntVal, TinyIntVal)

 CAST_FUNCTION(IntVal, TinyIntVal)

 CAST_FUNCTION(BigIntVal, TinyIntVal)

 CAST_FUNCTION(FloatVal, TinyIntVal)

 CAST_FUNCTION(DoubleVal, TinyIntVal)


 // Target: SmallIntVal.
 CAST_FUNCTION(BooleanVal, SmallIntVal)

 CAST_FUNCTION(TinyIntVal, SmallIntVal)

 CAST_FUNCTION(IntVal, SmallIntVal)

 CAST_FUNCTION(BigIntVal, SmallIntVal)

 CAST_FUNCTION(FloatVal, SmallIntVal)

 CAST_FUNCTION(DoubleVal, SmallIntVal)


 // Target: IntVal.
 CAST_FUNCTION(BooleanVal, IntVal)

 CAST_FUNCTION(TinyIntVal, IntVal)

 CAST_FUNCTION(SmallIntVal, IntVal)

 CAST_FUNCTION(BigIntVal, IntVal)

 CAST_FUNCTION(FloatVal, IntVal)

 CAST_FUNCTION(DoubleVal, IntVal)


 // Target: BigIntVal.
 CAST_FUNCTION(BooleanVal, BigIntVal)

 CAST_FUNCTION(TinyIntVal, BigIntVal)

 CAST_FUNCTION(SmallIntVal, BigIntVal)

 CAST_FUNCTION(IntVal, BigIntVal)

 CAST_FUNCTION(FloatVal, BigIntVal)

 CAST_FUNCTION(DoubleVal, BigIntVal)


 // Target: FloatVal.
 CAST_FUNCTION(BooleanVal, FloatVal)

 CAST_FUNCTION(TinyIntVal, FloatVal)

 CAST_FUNCTION(SmallIntVal, FloatVal)

 CAST_FUNCTION(IntVal, FloatVal)

 CAST_FUNCTION(BigIntVal, FloatVal)

 CAST_FUNCTION(DoubleVal, FloatVal)


 // Target: DoubleVal.
 CAST_FUNCTION(BooleanVal, DoubleVal)

 CAST_FUNCTION(TinyIntVal, DoubleVal)

 CAST_FUNCTION(SmallIntVal, DoubleVal)

 CAST_FUNCTION(IntVal, DoubleVal)

 CAST_FUNCTION(BigIntVal, DoubleVal)

 CAST_FUNCTION(FloatVal, DoubleVal)


 // Generates CastFunctions::CastTo<num_type>(ctx, const StringVal&).
 // The string's bytes (val.ptr, val.len) are parsed as 'native_type' by
 // StringParser::<string_parser_fn>. The result is NULL when the input is NULL or when
 // the parser reports anything other than PARSE_SUCCESS.
 #define CAST_FROM_STRING(num_type, native_type, string_parser_fn) \
   num_type CastFunctions::CastTo##num_type(FunctionContext* ctx, const StringVal& val) { \
     if (val.is_null) return num_type::null(); \
     StringParser::ParseResult parse_status; \
     native_type parsed = StringParser::string_parser_fn<native_type>( \
         reinterpret_cast<char*>(val.ptr), val.len, &parse_status); \
     if (UNLIKELY(parse_status != StringParser::PARSE_SUCCESS)) { \
       return num_type::null(); \
     } \
     return num_type(parsed); \
   }


 // Instantiate the string -> number casts. Integer targets are parsed with
 // StringParser::StringToInt, floating-point targets with StringParser::StringToFloat.
 CAST_FROM_STRING(TinyIntVal, int8_t, StringToInt)

 CAST_FROM_STRING(SmallIntVal, int16_t, StringToInt)

 CAST_FROM_STRING(IntVal, int32_t, StringToInt)

 CAST_FROM_STRING(BigIntVal, int64_t, StringToInt)

 CAST_FROM_STRING(FloatVal, float, StringToFloat)

 CAST_FROM_STRING(DoubleVal, double, StringToFloat)


 // Generates CastFunctions::CastToStringVal(ctx, const num_type&).
 // The value is formatted with lexical_cast<string>, copied into a StringVal via
 // AnyValUtil::FromString, and then passed through AnyValUtil::TruncateIfNecessary
 // using the function's declared return type. A NULL input yields a NULL string.
 #define CAST_TO_STRING(num_type) \
   StringVal CastFunctions::CastToStringVal(FunctionContext* ctx, const num_type& val) { \
     if (val.is_null) return StringVal::null(); \
     ColumnType return_type = AnyValUtil::TypeDescToColumnType(ctx->GetReturnType()); \
     string formatted = lexical_cast<string>(val.val); \
     StringVal out = AnyValUtil::FromString(ctx, formatted); \
     AnyValUtil::TruncateIfNecessary(return_type, &out); \
     return out; \
   }


 // Instantiate the generic to-string cast for BooleanVal and for the integer types
 // other than TinyIntVal (TinyIntVal has its own hand-written overload in this file).
 CAST_TO_STRING(BooleanVal);

 CAST_TO_STRING(SmallIntVal);

 CAST_TO_STRING(IntVal);

 CAST_TO_STRING(BigIntVal);


 // Generates CastFunctions::CastToStringVal(ctx, const float_type&).
 //   float_type: FloatVal or DoubleVal.
 //   format:     printf-style format string used to render val.val.
 // A NULL input yields a NULL string. NaN (of either sign) is rendered as "nan". Every
 // non-NULL result, including "nan", is passed through AnyValUtil::TruncateIfNecessary
 // with the declared return type, so all paths respect the same length handling.
 #define CAST_FLOAT_TO_STRING(float_type, format) \
   StringVal CastFunctions::CastToStringVal(FunctionContext* ctx, const float_type& val) { \
     if (val.is_null) return StringVal::null(); \
     ColumnType return_type = AnyValUtil::TypeDescToColumnType(ctx->GetReturnType()); \
     /* val.val could be -nan, return "nan" instead. The StringVal points at the */ \
     /* literal; truncation is applied to it exactly as for the formatted path. */ \
     if (isnan(val.val)) { \
       StringVal nan_sv("nan"); \
       AnyValUtil::TruncateIfNecessary(return_type, &nan_sv); \
       return nan_sv; \
     } \
     /* Add 1 to MAX_FLOAT_CHARS since snprintf adds a trailing '\0' */ \
     StringVal sv(ctx, MAX_FLOAT_CHARS + 1); \
     /* snprintf returns the number of characters written, excluding the '\0' */ \
     sv.len = snprintf(reinterpret_cast<char*>(sv.ptr), sv.len, format, val.val); \
     DCHECK_GT(sv.len, 0); \
     DCHECK_LE(sv.len, MAX_FLOAT_CHARS); \
     AnyValUtil::TruncateIfNecessary(return_type, &sv); \
     return sv; \
   }


 // Floats have up to 9 significant digits, doubles up to 17, hence the "%.9g" and

 // "%.17g" precisions below

 // (see http://en.wikipedia.org/wiki/Single-precision_floating-point_format

 // and http://en.wikipedia.org/wiki/Double-precision_floating-point_format)

 CAST_FLOAT_TO_STRING(FloatVal, "%.9g");

 CAST_FLOAT_TO_STRING(DoubleVal, "%.17g");


 // TinyIntVal gets a dedicated overload instead of CAST_TO_STRING: boost's lexical_cast
 // treats the int8_t payload as a character rather than as a number, so the value is
 // widened to int64_t before formatting. NULL in, NULL out; the result is truncated to
 // the declared return type if necessary.
 StringVal CastFunctions::CastToStringVal(FunctionContext* ctx, const TinyIntVal& val) {
   if (val.is_null) return StringVal::null();
   const int64_t widened = static_cast<int64_t>(val.val);
   ColumnType return_type = AnyValUtil::TypeDescToColumnType(ctx->GetReturnType());
   string formatted = lexical_cast<string>(widened);
   StringVal out = AnyValUtil::FromString(ctx, formatted);
   AnyValUtil::TruncateIfNecessary(return_type, &out);
   return out;
 }


 // Casts a timestamp to a string. The TimestampVal is converted to a TimestampValue and
 // formatted with lexical_cast<string>; the result is then truncated to the declared
 // return type if necessary. A NULL input yields a NULL string.
 StringVal CastFunctions::CastToStringVal(FunctionContext* ctx, const TimestampVal& val) {
   if (val.is_null) return StringVal::null();
   TimestampValue timestamp = TimestampValue::FromTimestampVal(val);
   ColumnType return_type = AnyValUtil::TypeDescToColumnType(ctx->GetReturnType());
   string formatted = lexical_cast<string>(timestamp);
   StringVal out = AnyValUtil::FromString(ctx, formatted);
   AnyValUtil::TruncateIfNecessary(return_type, &out);
   return out;
 }


 // Casts a string to a (possibly length-limited) string type. No bytes are copied: the
 // result shares the input's buffer and only goes through
 // AnyValUtil::TruncateIfNecessary for the declared return type. NULL in, NULL out.
 StringVal CastFunctions::CastToStringVal(FunctionContext* ctx, const StringVal& val) {
   if (val.is_null) return StringVal::null();
   // 'val' is known to be non-NULL here, so a plain copy carries over ptr and len.
   StringVal aliased(val);
   ColumnType return_type = AnyValUtil::TypeDescToColumnType(ctx->GetReturnType());
   AnyValUtil::TruncateIfNecessary(return_type, &aliased);
   return aliased;
 }


 // Casts a string to the fixed-length CHAR type given by the function's return type.
 //   - NULL input: returns NULL.
 //   - Input shorter than the CHAR length: the bytes are copied into a buffer of
 //     type.len bytes obtained from ctx->impl()->AllocateLocal() and the remainder is
 //     filled by StringValue::PadWithSpaces.
 //   - Otherwise: no copy is made; the result points at the input's buffer and only
 //     its length is set to type.len (i.e. the input is truncated).
 // The returned StringVal always has len == type.len.
 StringVal CastFunctions::CastToChar(FunctionContext* ctx, const StringVal& val) {
   if (val.is_null) return StringVal::null();

   ColumnType type = AnyValUtil::TypeDescToColumnType(ctx->GetReturnType());
   DCHECK(type.type == TYPE_CHAR);
   DCHECK_GE(type.len, 1);
   char* cptr;
   if (type.len > val.len) {
     cptr = reinterpret_cast<char*>(ctx->impl()->AllocateLocal(type.len));
     // In this branch val.len < type.len, so the whole input fits in the new buffer.
     // Skip the copy for an empty input: its ptr may be NULL, and calling memcpy with
     // a NULL source is undefined behaviour even when the length is 0.
     if (val.len > 0) memcpy(cptr, val.ptr, val.len);
     StringValue::PadWithSpaces(cptr, type.len, val.len);
   } else {
     cptr = reinterpret_cast<char*>(val.ptr);
   }
   StringVal sv;
   sv.ptr = reinterpret_cast<uint8_t*>(cptr);
   sv.len = type.len;
   return sv;
 }


 // Generates CastFunctions::CastTo<to_type>(ctx, const TimestampVal&).
 // The result is NULL when the input is NULL or when the converted TimestampValue
 // reports no date (HasDate() is false); otherwise it is to_type constructed from
 // TimestampValue::ToUnixTime().
 #define CAST_FROM_TIMESTAMP(to_type) \
   to_type CastFunctions::CastTo##to_type( \
       FunctionContext* ctx, const TimestampVal& val) { \
     if (val.is_null) return to_type::null(); \
     TimestampValue timestamp = TimestampValue::FromTimestampVal(val); \
     if (timestamp.HasDate()) return to_type(timestamp.ToUnixTime()); \
     return to_type::null(); \
   }


 // Instantiate timestamp -> boolean/integer casts; these are built from
 // TimestampValue::ToUnixTime().
 CAST_FROM_TIMESTAMP(BooleanVal);

 CAST_FROM_TIMESTAMP(TinyIntVal);

 CAST_FROM_TIMESTAMP(SmallIntVal);

 CAST_FROM_TIMESTAMP(IntVal);

 CAST_FROM_TIMESTAMP(BigIntVal);


 // Generates CastFunctions::CastTo<to_type>(ctx, const TimestampVal&) for targets that
 // are built from TimestampValue::ToSubsecondUnixTime().
 // The result is NULL when the input is NULL or when the converted TimestampValue
 // reports no date (HasDate() is false).
 #define CAST_FROM_SUBSECOND_TIMESTAMP(to_type) \
   to_type CastFunctions::CastTo##to_type( \
       FunctionContext* ctx, const TimestampVal& val) { \
     if (val.is_null) return to_type::null(); \
     TimestampValue timestamp = TimestampValue::FromTimestampVal(val); \
     if (timestamp.HasDate()) return to_type(timestamp.ToSubsecondUnixTime()); \
     return to_type::null(); \
   }


 // Instantiate timestamp -> floating-point casts; these are built from
 // TimestampValue::ToSubsecondUnixTime().
 CAST_FROM_SUBSECOND_TIMESTAMP(FloatVal);

 CAST_FROM_SUBSECOND_TIMESTAMP(DoubleVal);


 // Generates CastFunctions::CastToTimestampVal(ctx, const from_type&).
 // A TimestampValue is constructed directly from the input's 'val' member. The result
 // is NULL when the input is NULL or when that TimestampValue reports no date
 // (HasDate() is false); otherwise it is exported with ToTimestampVal().
 #define CAST_TO_TIMESTAMP(from_type) \
   TimestampVal CastFunctions::CastToTimestampVal(FunctionContext* ctx, \
                                                  const from_type& val) { \
     if (val.is_null) return TimestampVal::null(); \
     TimestampValue converted(val.val); \
     if (converted.HasDate()) { \
       TimestampVal out; \
       converted.ToTimestampVal(&out); \
       return out; \
     } \
     return TimestampVal::null(); \
   }


 // Instantiate boolean/numeric -> timestamp casts for every non-string source type.
 // The StringVal source has its own hand-written overload in this file.
 CAST_TO_TIMESTAMP(BooleanVal);

 CAST_TO_TIMESTAMP(TinyIntVal);

 CAST_TO_TIMESTAMP(SmallIntVal);

 CAST_TO_TIMESTAMP(IntVal);

 CAST_TO_TIMESTAMP(BigIntVal);

 CAST_TO_TIMESTAMP(FloatVal);

 CAST_TO_TIMESTAMP(DoubleVal);


 // Casts a string to a timestamp by constructing a TimestampValue from the string's
 // bytes (val.ptr, val.len). Returns NULL for a NULL input, and also when the resulting
 // TimestampValue has neither a date nor a time, i.e. the string did not parse.
 TimestampVal CastFunctions::CastToTimestampVal(FunctionContext* ctx,
                                                const StringVal& val) {
   if (val.is_null) return TimestampVal::null();
   TimestampValue parsed(reinterpret_cast<char*>(val.ptr), val.len);
   if (parsed.HasDateOrTime()) {
     TimestampVal out;
     parsed.ToTimestampVal(&out);
     return out;
   }
   // 'val' did not parse.
   return TimestampVal::null();
 }

impala_udf::TinyIntVal::val
int8_t val
Definition: udf.h:383

cast-functions.h

timestamp-value.h

impala::AnyValUtil::TruncateIfNecessary
static void TruncateIfNecessary(const ColumnType &type, StringVal *val)
Definition: anyval-util.h:188

impala_udf::FunctionContext::impl
impala::FunctionContextImpl * impl()
TODO: Add mechanism for UDAs to update stats similar to runtime profile counters. ...
Definition: udf.h:202

impala::TYPE_CHAR
Definition: types.h:47

impala_udf::FunctionContext::GetReturnType
const TypeDesc & GetReturnType() const
Definition: udf-ir.cc:34

string-functions.h

CAST_TO_STRING
#define CAST_TO_STRING(num_type)
Definition: cast-functions.cc:108

impala::AnyValUtil::TypeDescToColumnType
static ColumnType TypeDescToColumnType(const FunctionContext::TypeDesc &type)
Definition: anyval-util.cc:101

CAST_FUNCTION
#define CAST_FUNCTION(from_type, to_type)
Definition: cast-functions.cc:35

impala_udf::DoubleVal
Definition: udf.h:475

impala::CastFunctions::CastToTimestampVal
static TimestampVal CastToTimestampVal(FunctionContext *context, const BooleanVal &val)

CAST_FLOAT_TO_STRING
#define CAST_FLOAT_TO_STRING(float_type, format)
Definition: cast-functions.cc:122

impala::TimestampValue::HasDateOrTime
bool HasDateOrTime() const
Definition: timestamp-value.h:134

impala::StringValue::PadWithSpaces
static void PadWithSpaces(char *cptr, int64_t cptr_len, int64_t num_chars)
Definition: string-value.inline.h:100

CAST_TO_TIMESTAMP
#define CAST_TO_TIMESTAMP(from_type)
Definition: cast-functions.cc:220

CAST_FROM_TIMESTAMP
#define CAST_FROM_TIMESTAMP(to_type)
Definition: cast-functions.cc:193

impala_udf::TimestampVal
This object has a compatible storage format with boost::ptime.
Definition: udf.h:495

impala::CastFunctions::CastToChar
static StringVal CastToChar(FunctionContext *context, const StringVal &val)
Definition: cast-functions.cc:173

impala_udf::StringVal::ptr
uint8_t * ptr
Definition: udf.h:523

impala::TimestampValue::ToTimestampVal
void ToTimestampVal(impala_udf::TimestampVal *tv) const
Definition: timestamp-value.h:121

impala_udf::FunctionContext
Definition: udf.h:47

impala_udf::AnyVal::is_null
bool is_null
Definition: udf.h:359

impala_udf::TinyIntVal
Definition: udf.h:382

impala_udf::FloatVal
Definition: udf.h:458

impala::ColumnType::type
PrimitiveType type
Definition: types.h:60

CAST_FROM_SUBSECOND_TIMESTAMP
#define CAST_FROM_SUBSECOND_TIMESTAMP(to_type)
Definition: cast-functions.cc:208

anyval-util.h

string-parser.h

impala_udf::SmallIntVal
Definition: udf.h:401

impala::TimestampValue
Definition: timestamp-value.h:65

impala_udf::StringVal
Definition: udf.h:521

impala::ColumnType::len
int len
Only set if type == TYPE_CHAR or type == TYPE_VARCHAR.
Definition: types.h:62

impala::AnyValUtil::FromString
static StringVal FromString(FunctionContext *ctx, const std::string &s)
Definition: anyval-util.h:183

CAST_FROM_STRING
#define CAST_FROM_STRING(num_type, native_type, string_parser_fn)
Definition: cast-functions.cc:90

impala_udf::IntVal
Definition: udf.h:420

impala::TimestampValue::FromTimestampVal
static TimestampValue FromTimestampVal(const impala_udf::TimestampVal &udf_value)
Definition: timestamp-value.h:111

impala_udf::BigIntVal
Definition: udf.h:439

impala::ColumnType
Definition: types.h:59

names.h

impala::FunctionContextImpl::AllocateLocal
uint8_t * AllocateLocal(int byte_size)
Definition: udf.cc:386

MAX_FLOAT_CHARS
const int MAX_FLOAT_CHARS
Definition: cast-functions.cc:33

decimal-functions.h

impala::CastFunctions::CastToStringVal
static StringVal CastToStringVal(FunctionContext *context, const BooleanVal &val)

impala_udf::StringVal::len
int len
Definition: udf.h:522

impala_udf::BooleanVal
Definition: udf.h:363