doc/html/read-write-util_8h_source.html

 // Copyright 2012 Cloudera Inc.

 //

 // Licensed under the Apache License, Version 2.0 (the "License");

 // you may not use this file except in compliance with the License.

 // You may obtain a copy of the License at

 //

 // http://www.apache.org/licenses/LICENSE-2.0

 //

 // Unless required by applicable law or agreed to in writing, software

 // distributed under the License is distributed on an "AS IS" BASIS,

 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 // See the License for the specific language governing permissions and

 // limitations under the License.


 #ifndef IMPALA_EXEC_READ_WRITE_UTIL_H

 #define IMPALA_EXEC_READ_WRITE_UTIL_H


 #include <boost/cstdint.hpp>
 #include <cstring>
 #include <sstream>
 #include "common/logging.h"
 #include "common/status.h"
 #include "util/bit-util.h"


 namespace impala {


 // Returns false from the enclosing function when x evaluates to false.
 // Wrapped in do { } while (false) so the macro expands to exactly one statement:
 // a bare `if` would silently capture an `else` that follows the macro call.
 // Invoke with a trailing semicolon: RETURN_IF_FALSE(cond);
 #define RETURN_IF_FALSE(x) do { if (UNLIKELY(!(x))) return false; } while (false)


 // Static helpers for reading and writing integers in the byte encodings used by
 // the file-format readers/writers: fixed-width big endian integers, Writable
 // variable-length VInt/VLong values, and zigzag encoded ZInt/ZLong values.
 class ReadWriteUtil {

  public:

   // Maximum length in bytes of an encoded Writable VInt/VLong (first byte included).
   static const int MAX_VINT_LEN = 9;


   // Maximum lengths in bytes for zigzag encodings of a 32-bit and a 64-bit value.
   const static int MAX_ZINT_LEN = 5;

   const static int MAX_ZLONG_LEN = 10;


   // Put a zigzag encoded integer into a buffer and return its length.
   // Defined in read-write-util.cc.
   static int PutZInt(int32_t integer, uint8_t* buf);


   // Put a zigzag encoded long integer into a buffer and return its length.
   // Defined in read-write-util.cc.
   static int PutZLong(int64_t longint, uint8_t* buf);


   // Get a big endian integer from a buffer. The buffer does not have to be word
   // aligned. Only the uint16_t, uint32_t and uint64_t specializations are defined.
   template<typename T>

   static T GetInt(const uint8_t* buffer);


   // Decode the Writable VLong/VInt that starts at buf[0] into *vlong / *vint and
   // return the encoded length in bytes as reported by DecodeVIntSize().
   // GetVInt() decodes a full VLong and truncates the result to 32 bits.
   static int GetVLong(uint8_t* buf, int64_t* vlong);

   static int GetVInt(uint8_t* buf, int32_t* vint);


   // Write val to buf as a Writable VLong/VInt and return the number of bytes
   // written. PutVInt() forwards to PutVLong().
   static int64_t PutVLong(int64_t val, uint8_t* buf);

   static int64_t PutVInt(int32_t val, uint8_t* buf);


   // Returns the size of the encoded long value, not including the 1 byte for length.
   static int VLongRequiredBytes(int64_t val);


   // Same as the two-argument GetVLong(), but the encoded value starts at
   // buf[offset]. Returns -1 if the decoded length exceeds MAX_VINT_LEN.
   static int GetVLong(uint8_t* buf, int64_t offset, int64_t* vlong);


   // Put an integer into buf in big endian byte order (the counterpart of
   // GetInt()). buf must have room for sizeof(integer) bytes.
   static void PutInt(uint8_t* buf, uint16_t integer);

   static void PutInt(uint8_t* buf, uint32_t integer);

   static void PutInt(uint8_t* buf, uint64_t integer);


   // Dump the first length bytes of buf to a Hex string.
   // Defined in read-write-util.cc.
   static std::string HexDump(const uint8_t* buf, int64_t length);

   static std::string HexDump(const char* buf, int64_t length);


   // Determines the sign of a VInt/VLong from the first byte.
   static bool IsNegativeVInt(int8_t byte);


   // Determines the total length in bytes of a Writable VInt/VLong from the first byte.
   static int DecodeVIntSize(int8_t byte);


   // Defined in read-write-util.cc; presumably reads a zigzag encoded long and
   // advances *buf past it (NOTE(review): confirm against the .cc file).
   static int64_t ReadZLong(uint8_t** buf);


   // Read a zig-zag encoded int. Calls ReadZLong() and truncates to 32 bits.
   static int32_t ReadZInt(uint8_t** buf);


   // Read sizeof(T) bytes from *buf into *val, then advance *buf and decrease
   // *buf_len by that amount. If fewer than sizeof(T) bytes remain, sets *status
   // to an error, leaves the cursor untouched and returns false.
   template <class T>

   static bool Read(uint8_t** buf, int* buf_len, T* val, Status* status);


   // Skip the next num_bytes bytes: advances *buf and decreases *buf_len. If
   // num_bytes exceeds *buf_len, sets *status to an error and returns false.
   static bool SkipBytes(uint8_t** buf, int* buf_len, int num_bytes, Status* status);

 };


 // Reads a 16-bit big endian integer from the two bytes at buf.
 // The bytes are combined one at a time, so buf need not be aligned.
 template<>
 inline uint16_t ReadWriteUtil::GetInt(const uint8_t* buf) {
   const int high_part = buf[0] << 8;
   const int low_part = buf[1];
   return static_cast<uint16_t>(high_part | low_part);
 }


 // Reads a 32-bit big endian integer from the four bytes at buf.
 // The bytes are combined one at a time, so buf need not be aligned.
 template<>
 inline uint32_t ReadWriteUtil::GetInt(const uint8_t* buf) {
   // Widen each byte to uint32_t before shifting: a uint8_t promotes to (signed)
   // int, and shifting a value >= 0x80 left by 24 would overflow into the sign bit.
   return (static_cast<uint32_t>(buf[0]) << 24) |
          (static_cast<uint32_t>(buf[1]) << 16) |
          (static_cast<uint32_t>(buf[2]) << 8) |
          static_cast<uint32_t>(buf[3]);
 }


 // Reads a 64-bit big endian integer from the eight bytes at buf by decoding
 // two consecutive 32-bit big endian words; the first word is the high half.
 template<>
 inline uint64_t ReadWriteUtil::GetInt(const uint8_t* buf) {
   const uint64_t high_word = GetInt<uint32_t>(buf);
   const uint64_t low_word = GetInt<uint32_t>(buf + 4);
   return (high_word << 32) | low_word;
 }


 // Writes a 16-bit integer to buf[0..1], most significant byte first.
 inline void ReadWriteUtil::PutInt(uint8_t* buf, uint16_t integer) {
   const uint8_t high_byte = static_cast<uint8_t>(integer >> 8);
   const uint8_t low_byte = static_cast<uint8_t>(integer & 0xFF);
   buf[0] = high_byte;
   buf[1] = low_byte;
 }


 // Writes a 32-bit integer to buf[0..3], most significant byte first.
 // Bytes are produced by shifting rather than by byte-swapping and copying the
 // in-memory representation, so the output is big endian regardless of the
 // host's byte order. buf need not be aligned.
 inline void ReadWriteUtil::PutInt(uint8_t* buf, uint32_t integer) {
   buf[0] = static_cast<uint8_t>(integer >> 24);
   buf[1] = static_cast<uint8_t>(integer >> 16);
   buf[2] = static_cast<uint8_t>(integer >> 8);
   buf[3] = static_cast<uint8_t>(integer);
 }


 // Writes a 64-bit integer to buf[0..7], most significant byte first.
 // Bytes are produced by shifting rather than by byte-swapping and copying the
 // in-memory representation, so the output is big endian regardless of the
 // host's byte order. buf need not be aligned.
 inline void ReadWriteUtil::PutInt(uint8_t* buf, uint64_t integer) {
   for (int i = 0; i < 8; ++i) {
     // Byte i holds bits [8 * (7 - i), 8 * (7 - i) + 7] of the value.
     buf[i] = static_cast<uint8_t>(integer >> (8 * (7 - i)));
   }
 }


 // Decodes the variable-length integer at buf via GetVLong() and stores the
 // result, truncated to 32 bits, in *vint. Returns whatever GetVLong() returned.
 inline int ReadWriteUtil::GetVInt(uint8_t* buf, int32_t* vint) {
   int64_t decoded = 0;
   const int encoded_len = GetVLong(buf, &decoded);
   *vint = static_cast<int32_t>(decoded);
   return encoded_len;
 }


 inline int ReadWriteUtil::GetVLong(uint8_t* buf, int64_t* vlong) {

   return GetVLong(buf, 0, vlong);

 }


 // Decodes the Writable VLong that starts at buf[offset] and stores it in *vlong.
 //
 // The first byte either holds the value itself (encoded length 1) or encodes the
 // sign and the total length; in the latter case the remaining len - 1 bytes hold
 // the magnitude, most significant byte first, and a negative value is stored as
 // its one's complement.
 //
 // Returns the total number of encoded bytes (first byte included), or -1 if the
 // decoded length exceeds MAX_VINT_LEN, in which case *vlong is left untouched.
 inline int ReadWriteUtil::GetVLong(uint8_t* buf, int64_t offset, int64_t* vlong) {
   const uint8_t* encoded = buf + offset;
   const int8_t firstbyte = static_cast<int8_t>(encoded[0]);

   const int len = DecodeVIntSize(firstbyte);
   if (len > MAX_VINT_LEN) return -1;
   if (len == 1) {
     *vlong = static_cast<int64_t>(firstbyte);
     return len;
   }

   // Accumulate in a local unsigned value: this never reads the caller's
   // (possibly uninitialized) output, and shifting the top byte into bit 63 is
   // well defined for unsigned types.
   uint64_t bits = 0;
   for (int i = 1; i < len; ++i) {
     bits = (bits << 8) | encoded[i];
   }

   // Negative values are stored as their one's complement.
   if (IsNegativeVInt(firstbyte)) bits = ~bits;

   *vlong = static_cast<int64_t>(bits);
   return len;
 }


 // Returns the number of payload bytes needed to encode val as a Writable VLong,
 // not including the 1 byte for length. The result is always in [1, 8].
 //
 // Negative values are stored as their one's complement, so the size is computed
 // from ~val for val < 0. Values in [-112, 127] are written as a single byte with
 // no separate length byte; 1 is returned for them as well.
 inline int ReadWriteUtil::VLongRequiredBytes(int64_t val) {
   uint64_t magnitude = static_cast<uint64_t>(val < 0 ? ~val : val);
   int num_bytes = 1;
   // Count the bytes up to and including the most significant non-zero byte.
   while ((magnitude >>= 8) != 0) ++num_bytes;
   return num_bytes;
 }

 // Writes val to buf in the Writable VLong format understood by GetVLong() and
 // returns the number of bytes written (at most MAX_VINT_LEN; buf must have room).
 //
 // Values in [-112, 127] are written as a single byte holding the value itself.
 // Any other value is written as a prefix byte followed by num_bytes payload
 // bytes, most significant first:
 //   - non-negative: prefix is -112 - num_bytes (-113..-120), payload is val
 //   - negative:     prefix is -120 - num_bytes (-121..-128), payload is ~val
 // These are exactly the prefixes DecodeVIntSize() and IsNegativeVInt() decode.
 inline int64_t ReadWriteUtil::PutVLong(int64_t val, uint8_t* buf) {
   if (val >= -112 && val <= 127) {
     // store the value itself instead of the length
     buf[0] = static_cast<uint8_t>(val);
     return 1;
   }

   const bool is_negative = val < 0;
   const uint64_t magnitude = static_cast<uint64_t>(is_negative ? ~val : val);
   const int num_bytes = VLongRequiredBytes(val);

   // The prefix byte encodes both the sign and the payload length.
   const int prefix = (is_negative ? -120 : -112) - num_bytes;
   buf[0] = static_cast<uint8_t>(prefix);

   // write the payload to the buffer in big endian order
   for (int i = 0; i < num_bytes; ++i) {
     buf[i + 1] = static_cast<uint8_t>((magnitude >> (8 * (num_bytes - i - 1))) & 0xFF);
   }

   // +1 for the length byte
   return num_bytes + 1;
 }


 // Writes a 32-bit value to buf as a variable-length integer. The value is
 // widened to 64 bits and encoded by PutVLong(); returns PutVLong()'s result.
 inline int64_t ReadWriteUtil::PutVInt(int32_t val, uint8_t* buf) {
   const int64_t widened = val;
   return PutVLong(widened, buf);
 }


 // Read a zig-zag encoded int: delegates to ReadZLong() and truncates the
 // result to 32 bits.
 inline int32_t ReadWriteUtil::ReadZInt(uint8_t** buf) {
   return static_cast<int32_t>(ReadZLong(buf));
 }


 // Reads a value of type T from the front of the buffer.
 //
 // On success, copies sizeof(T) bytes from *buf into *val, advances *buf past
 // them, decreases *buf_len accordingly and returns true. If fewer than sizeof(T)
 // bytes remain, sets *status to an error describing the shortfall, leaves *buf,
 // *buf_len and *val untouched and returns false.
 //
 // NOTE(review): the bytes are copied verbatim, so T is assumed to be a trivially
 // copyable type (e.g. a fixed-width integer) -- confirm against callers.
 template <class T>
 inline bool ReadWriteUtil::Read(uint8_t** buf, int* buf_len, T* val, Status* status) {
   int val_len = sizeof(T);
   if (UNLIKELY(val_len > *buf_len)) {
     std::stringstream ss;
     ss << "Cannot read " << val_len << " bytes, buffer length is " << *buf_len;
     *status = Status(ss.str());
     return false;
   }
   // *buf is an arbitrary byte position and is generally not aligned for T.
   // Dereferencing it through a T* would be an unaligned, aliasing-violating
   // load; memcpy is the well-defined way to read the bytes.
   memcpy(val, *buf, sizeof(T));
   *buf += val_len;
   *buf_len -= val_len;
   return true;
 }


 // Skip the next num_bytes bytes of the buffer.
 //
 // On success, advances *buf by num_bytes, decreases *buf_len by the same amount
 // and returns true. If num_bytes exceeds *buf_len, sets *status to an error,
 // leaves the cursor untouched and returns false.
 inline bool ReadWriteUtil::SkipBytes(uint8_t** buf, int* buf_len, int num_bytes,
                                      Status* status) {
   DCHECK_GE(*buf_len, 0);
   const int remaining = *buf_len;
   const bool enough_bytes = num_bytes <= remaining;
   if (UNLIKELY(!enough_bytes)) {
     std::stringstream msg;
     msg << "Cannot skip " << num_bytes << " bytes, buffer length is " << remaining;
     *status = Status(msg.str());
     return false;
   }
   *buf_len = remaining - num_bytes;
   *buf += num_bytes;
   return true;
 }


 // Determines the sign of a VInt/VLong from its first byte.
 // The value is negative when the first byte is in [-128, -121] or in [-112, -1].
 inline bool ReadWriteUtil::IsNegativeVInt(int8_t byte) {
   if (byte >= 0) return false;
   // Among negative first bytes, only [-120, -113] denote a non-negative value.
   const bool positive_length_marker = (byte >= -120) && (byte < -112);
   return !positive_length_marker;
 }


 // Determines the total length in bytes of a Writable VInt/VLong from its first
 // byte:
 //   [-128, -121] -> -119 - byte (2..9 bytes)
 //   [-120, -113] -> -111 - byte (2..9 bytes)
 //   [-112,  127] -> 1 (the byte is the value itself)
 inline int ReadWriteUtil::DecodeVIntSize(int8_t byte) {
   if (byte < -120) return -119 - byte;
   if (byte < -112) return -111 - byte;
   return 1;
 }


 }

 #endif

impala::ReadWriteUtil::DecodeVIntSize
static int DecodeVIntSize(int8_t byte)
Determines the total length in bytes of a Writable VInt/VLong from the first byte.
Definition: read-write-util.h:254

impala::ReadWriteUtil::MAX_ZINT_LEN
static const int MAX_ZINT_LEN
Maximum lengths for Zigzag encodings.
Definition: read-write-util.h:40

impala::ReadWriteUtil::PutZInt
static int PutZInt(int32_t integer, uint8_t *buf)
Put a zigzag encoded integer into a buffer and return its length.
Definition: read-write-util.cc:38

logging.h

impala::ReadWriteUtil::SkipBytes
static bool SkipBytes(uint8_t **buf, int *buf_len, int num_bytes, Status *status)
Skip the next num_bytes bytes.
Definition: read-write-util.h:236

impala::BitUtil::ByteSwap
static int64_t ByteSwap(int64_t value)
Swaps the byte order (i.e. endianness)
Definition: bit-util.h:149

impala::Status
Definition: status.h:81

impala::ReadWriteUtil::PutInt
static void PutInt(uint8_t *buf, uint16_t integer)
Definition: read-write-util.h:126

impala::ReadWriteUtil::PutVLong
static int64_t PutVLong(int64_t val, uint8_t *buf)
Definition: read-write-util.h:191

impala::ReadWriteUtil::Read
static bool Read(uint8_t **buf, int *buf_len, T *val, Status *status)
Definition: read-write-util.h:222

impala::ReadWriteUtil::ReadZLong
static int64_t ReadZLong(uint8_t **buf)
Definition: read-write-util.cc:24

bit-util.h

impala::ReadWriteUtil::MAX_ZLONG_LEN
static const int MAX_ZLONG_LEN
Definition: read-write-util.h:41

uint64_t

impala::ReadWriteUtil::ReadZInt
static int32_t ReadZInt(uint8_t **buf)
Read a zig-zag encoded int.
Definition: read-write-util.h:216

impala::ReadWriteUtil::GetVInt
static int GetVInt(uint8_t *buf, int32_t *vint)
Definition: read-write-util.h:141

impala::ReadWriteUtil::IsNegativeVInt
static bool IsNegativeVInt(int8_t byte)
Determines the sign of a VInt/VLong from the first byte.
Definition: read-write-util.h:250

status.h

UNLIKELY
#define UNLIKELY(expr)
Definition: compiler-util.h:33

impala::ReadWriteUtil::GetVLong
static int GetVLong(uint8_t *buf, int64_t *vlong)
Definition: read-write-util.h:148

offset
uint8_t offset[7 *64-sizeof(uint64_t)]
Definition: partitioning-throughput-test.cc:37

impala::ReadWriteUtil
Definition: read-write-util.h:34

impala::ReadWriteUtil::HexDump
static std::string HexDump(const uint8_t *buf, int64_t length)
Dump the first length bytes of buf to a Hex string.
Definition: read-write-util.cc:72

impala::ReadWriteUtil::PutVInt
static int64_t PutVInt(int32_t val, uint8_t *buf)
Definition: read-write-util.h:212

impala::ReadWriteUtil::VLongRequiredBytes
static int VLongRequiredBytes(int64_t val)
Returns the size of the encoded long value, not including the 1 byte for length.
Definition: read-write-util.h:175

impala::ReadWriteUtil::MAX_VINT_LEN
static const int MAX_VINT_LEN
Maximum length for Writable VInt.
Definition: read-write-util.h:37

impala::ReadWriteUtil::GetInt
static T GetInt(const uint8_t *buffer)
Get a big endian integer from a buffer. The buffer does not have to be word aligned.

impala::ReadWriteUtil::PutZLong
static int PutZLong(int64_t longint, uint8_t *buf)
Put a zigzag encoded long integer into a buffer and return its length.
Definition: read-write-util.cc:55