OmniSciDB  8a228a1076
Datum.cpp File Reference
#include <cassert>
#include <cstdio>
#include <cstdlib>
#include <stdexcept>
#include <string>
#include "DateConverters.h"
#include "Logger/Logger.h"
#include "QueryEngine/DateTimeUtils.h"
#include "StringTransform.h"
#include "TimeGM.h"
#include "misc.h"
#include "sqltypes.h"
+ Include dependency graph for Datum.cpp:

Go to the source code of this file.

Functions

int64_t parse_numeric (const std::string_view s, SQLTypeInfo &ti)
 
Datum StringToDatum (std::string_view s, SQLTypeInfo &ti)
 
bool DatumEqual (const Datum a, const Datum b, const SQLTypeInfo &ti)
 
std::string DatumToString (Datum d, const SQLTypeInfo &ti)
 
SQLTypes decimal_to_int_type (const SQLTypeInfo &ti)
 
int64_t convert_decimal_value_to_scale (const int64_t decimal_value, const SQLTypeInfo &type_info, const SQLTypeInfo &new_type_info)
 

Function Documentation

◆ convert_decimal_value_to_scale()

int64_t convert_decimal_value_to_scale ( const int64_t  decimal_value,
const SQLTypeInfo &type_info,
const SQLTypeInfo &new_type_info 
)

Definition at line 315 of file Datum.cpp.

References SQLTypeInfo::get_scale().

Referenced by import_export::TypedImportBuffer::add_value(), Analyzer::Constant::cast_number(), SQLTypeInfo::get_storage_size(), anonymous_namespace{ArrowImporter.h}::ArrowValue< arrow::Decimal128 >::operator const DATA_TYPE(), and anonymous_namespace{TypedDataAccessors.h}::put_scalar().

317  {
318  auto converted_decimal_value = decimal_value;
319  if (new_type_info.get_scale() > type_info.get_scale()) {
320  for (int i = 0; i < new_type_info.get_scale() - type_info.get_scale(); i++) {
321  converted_decimal_value *= 10;
322  }
323  } else if (new_type_info.get_scale() < type_info.get_scale()) {
324  for (int i = 0; i < type_info.get_scale() - new_type_info.get_scale(); i++) {
325  if (converted_decimal_value > 0) {
326  converted_decimal_value = (converted_decimal_value + 5) / 10;
327  } else {
328  converted_decimal_value = (converted_decimal_value - 5) / 10;
329  }
330  }
331  }
332  return converted_decimal_value;
333 }
HOST DEVICE int get_scale() const
Definition: sqltypes.h:264
+ Here is the call graph for this function:
+ Here is the caller graph for this function:

◆ DatumEqual()

bool DatumEqual ( const Datum  a,
const Datum  b,
const SQLTypeInfo &ti 
)

Definition at line 190 of file Datum.cpp.

References Datum::bigintval, Datum::boolval, Datum::doubleval, Datum::floatval, SQLTypeInfo::get_compression(), SQLTypeInfo::get_type(), Datum::intval, kBIGINT, kBOOLEAN, kCHAR, kDATE, kDECIMAL, kDOUBLE, kENCODING_DICT, kFLOAT, kINT, kINTERVAL_DAY_TIME, kINTERVAL_YEAR_MONTH, kNUMERIC, kSMALLINT, kTEXT, kTIME, kTIMESTAMP, kTINYINT, kVARCHAR, Datum::smallintval, Datum::stringval, and Datum::tinyintval.

Referenced by SQLTypeInfo::get_storage_size(), and ChunkMetadata::operator==().

190  {
191  switch (ti.get_type()) {
192  case kBOOLEAN:
193  return a.boolval == b.boolval;
194  case kBIGINT:
195  case kNUMERIC:
196  case kDECIMAL:
197  return a.bigintval == b.bigintval;
198  case kINT:
199  return a.intval == b.intval;
200  case kSMALLINT:
201  return a.smallintval == b.smallintval;
202  case kTINYINT:
203  return a.tinyintval == b.tinyintval;
204  case kFLOAT:
205  return a.floatval == b.floatval;
206  case kDOUBLE:
207  return a.doubleval == b.doubleval;
208  case kTIME:
209  case kTIMESTAMP:
210  case kDATE:
211  case kINTERVAL_DAY_TIME:
212  case kINTERVAL_YEAR_MONTH:
213  return a.bigintval == b.bigintval;
214  case kTEXT:
215  case kVARCHAR:
216  case kCHAR:
217  if (ti.get_compression() == kENCODING_DICT) {
218  return a.intval == b.intval;
219  }
220  if (a.stringval == nullptr && b.stringval == nullptr) {
221  return true;
222  }
223  if (a.stringval == nullptr || b.stringval == nullptr) {
224  return false;
225  }
226  return *a.stringval == *b.stringval;
227  default:
228  return false;
229  }
230  return false;
231 }
int8_t tinyintval
Definition: sqltypes.h:135
Definition: sqltypes.h:51
bool boolval
Definition: sqltypes.h:134
HOST DEVICE EncodingType get_compression() const
Definition: sqltypes.h:267
int32_t intval
Definition: sqltypes.h:137
float floatval
Definition: sqltypes.h:139
int64_t bigintval
Definition: sqltypes.h:138
int16_t smallintval
Definition: sqltypes.h:136
std::string * stringval
Definition: sqltypes.h:143
Definition: sqltypes.h:54
Definition: sqltypes.h:55
Definition: sqltypes.h:43
HOST DEVICE SQLTypes get_type() const
Definition: sqltypes.h:259
Definition: sqltypes.h:47
double doubleval
Definition: sqltypes.h:140
+ Here is the call graph for this function:
+ Here is the caller graph for this function:

◆ DatumToString()

std::string DatumToString ( Datum  d,
const SQLTypeInfo &ti 
)

Definition at line 236 of file Datum.cpp.

References Datum::bigintval, Datum::boolval, CHECK_EQ, CHECK_LE, Datum::doubleval, Datum::floatval, shared::formatDate(), shared::formatDateTime(), shared::formatHMS(), SQLTypeInfo::get_dimension(), SQLTypeInfo::get_scale(), SQLTypeInfo::get_type(), SQLTypeInfo::get_type_name(), Datum::intval, kBIGINT, kBOOLEAN, kCHAR, kDATE, kDECIMAL, kDOUBLE, kFLOAT, kINT, kINTERVAL_DAY_TIME, kINTERVAL_YEAR_MONTH, kNUMERIC, kSMALLINT, kTEXT, kTIME, kTIMESTAMP, kTINYINT, kVARCHAR, Datum::smallintval, Datum::stringval, Datum::tinyintval, and to_string().

Referenced by Analyzer::Constant::cast_to_string(), datum_to_string(), ChunkMetadata::dump(), SQLTypeInfo::get_storage_size(), anonymous_namespace{ArrowImporter.h}::ArrowValue< int64_t >::operator const std::string(), Analyzer::Constant::toString(), Fragmenter_Namespace::InsertOrderFragmenter::updateChunkStats(), and ScalarExprToSql::visitConstant().

236  {
237  constexpr size_t buf_size = 32;
238  char buf[buf_size]; // Hold "2000-03-01 12:34:56.123456789" and large years.
239  switch (ti.get_type()) {
240  case kBOOLEAN:
241  if (d.boolval) {
242  return "t";
243  }
244  return "f";
245  case kNUMERIC:
246  case kDECIMAL: {
247  // we need to consider buf_size including the scale and null terminator
248  char str[ti.get_dimension() + ti.get_scale() + 2];
249  double v = (double)d.bigintval / pow(10, ti.get_scale());
250  sprintf(str, "%*.*f", ti.get_dimension(), ti.get_scale(), v);
251  return std::string(str);
252  }
253  case kINT:
254  return std::to_string(d.intval);
255  case kSMALLINT:
256  return std::to_string(d.smallintval);
257  case kTINYINT:
258  return std::to_string(d.tinyintval);
259  case kBIGINT:
260  return std::to_string(d.bigintval);
261  case kFLOAT:
262  return std::to_string(d.floatval);
263  case kDOUBLE:
264  return std::to_string(d.doubleval);
265  case kTIME: {
266  size_t const len = shared::formatHMS(buf, buf_size, d.bigintval);
267  CHECK_EQ(8u, len); // 8 == strlen("HH:MM:SS")
268  return buf;
269  }
270  case kTIMESTAMP: {
271  unsigned const dim = ti.get_dimension(); // assumes dim <= 9
272  size_t const len = shared::formatDateTime(buf, buf_size, d.bigintval, dim);
273  CHECK_LE(19u + bool(dim) + dim, len); // 19 = strlen("YYYY-MM-DD HH:MM:SS")
274  return buf;
275  }
276  case kDATE: {
277  size_t const len = shared::formatDate(buf, buf_size, d.bigintval);
278  CHECK_LE(10u, len); // 10 == strlen("YYYY-MM-DD")
279  return buf;
280  }
281  case kINTERVAL_DAY_TIME:
282  return std::to_string(d.bigintval) + " ms (day-time interval)";
283  case kINTERVAL_YEAR_MONTH:
284  return std::to_string(d.bigintval) + " month(s) (year-month interval)";
285  case kTEXT:
286  case kVARCHAR:
287  case kCHAR:
288  if (d.stringval == nullptr) {
289  return "NULL";
290  }
291  return *d.stringval;
292  default:
293  throw std::runtime_error("Internal error: invalid type " + ti.get_type_name() +
294  " in DatumToString.");
295  }
296  return "";
297 }
int8_t tinyintval
Definition: sqltypes.h:135
#define CHECK_EQ(x, y)
Definition: Logger.h:205
Definition: sqltypes.h:51
bool boolval
Definition: sqltypes.h:134
size_t formatDateTime(char *buf, size_t const max, int64_t const timestamp, int const dimension)
Definition: misc.cpp:42
int32_t intval
Definition: sqltypes.h:137
HOST DEVICE int get_scale() const
Definition: sqltypes.h:264
std::string to_string(char const *&&v)
size_t formatHMS(char *buf, size_t const max, int64_t const unixtime)
Definition: misc.cpp:78
float floatval
Definition: sqltypes.h:139
int64_t bigintval
Definition: sqltypes.h:138
int16_t smallintval
Definition: sqltypes.h:136
std::string * stringval
Definition: sqltypes.h:143
size_t formatDate(char *buf, size_t const max, int64_t const unixtime)
Definition: misc.cpp:25
Definition: sqltypes.h:54
Definition: sqltypes.h:55
#define CHECK_LE(x, y)
Definition: Logger.h:208
std::string get_type_name() const
Definition: sqltypes.h:362
HOST DEVICE int get_dimension() const
Definition: sqltypes.h:261
Definition: sqltypes.h:43
HOST DEVICE SQLTypes get_type() const
Definition: sqltypes.h:259
Definition: sqltypes.h:47
double doubleval
Definition: sqltypes.h:140
+ Here is the call graph for this function:
+ Here is the caller graph for this function:

◆ decimal_to_int_type()

SQLTypes decimal_to_int_type ( const SQLTypeInfo &ti)

Definition at line 299 of file Datum.cpp.

References CHECK, SQLTypeInfo::get_size(), kBIGINT, kINT, kNULLT, kSMALLINT, and kTINYINT.

Referenced by import_export::TypedImportBuffer::add_value(), CodeGenerator::codegen(), CodeGenerator::codegenIntConst(), anonymous_namespace{LogicalIR.cpp}::contains_unsafe_division(), import_export::Loader::distributeToShards(), extract_from_datum(), anonymous_namespace{ColumnIR.cpp}::get_col_decoder(), SQLTypeInfo::get_storage_size(), CgenState::getOrAddLiteral(), ResultSet::makeTargetValue(), import_export::NullArrayDatum(), import_export::NullDatum(), import_export::TypedImportBuffer::pop_value(), import_export::TDatumToDatum(), anonymous_namespace{ExpressionRewrite.cpp}::ConstantFoldingVisitor::visitBinOper(), and anonymous_namespace{ExpressionRewrite.cpp}::ConstantFoldingVisitor::visitUOper().

299  {
300  switch (ti.get_size()) {
301  case 1:
302  return kTINYINT;
303  case 2:
304  return kSMALLINT;
305  case 4:
306  return kINT;
307  case 8:
308  return kBIGINT;
309  default:
310  CHECK(false);
311  }
312  return kNULLT;
313 }
HOST DEVICE int get_size() const
Definition: sqltypes.h:269
#define CHECK(condition)
Definition: Logger.h:197
Definition: sqltypes.h:47
+ Here is the call graph for this function:
+ Here is the caller graph for this function:

◆ parse_numeric()

int64_t parse_numeric ( const std::string_view  s,
SQLTypeInfo &ti 
)

Definition at line 71 of file Datum.cpp.

References CHECK_GE, SQLTypeInfo::get_dimension(), SQLTypeInfo::get_scale(), run_benchmark_import::result, SQLTypeInfo::set_dimension(), SQLTypeInfo::set_notnull(), SQLTypeInfo::set_scale(), and to_string().

Referenced by StringToDatum().

71  {
72  assert(s.length() <= 20);
73  size_t dot = s.find_first_of('.', 0);
74  std::string before_dot;
75  std::string after_dot;
76  if (dot != std::string::npos) {
77  // make .99 as 0.99, or std::stoll below throws exception 'std::invalid_argument'
78  before_dot = (0 == dot) ? "0" : s.substr(0, dot);
79  after_dot = s.substr(dot + 1);
80  } else {
81  before_dot = s;
82  after_dot = "0";
83  }
84  const bool is_negative = before_dot.find_first_of('-', 0) != std::string::npos;
85  const int64_t sign = is_negative ? -1 : 1;
86  int64_t result;
87  result = std::abs(std::stoll(before_dot));
88  int64_t fraction = 0;
89  const size_t before_dot_digits = before_dot.length() - (is_negative ? 1 : 0);
90  if (!after_dot.empty()) {
91  fraction = std::stoll(after_dot);
92  }
93  if (ti.get_dimension() == 0) {
94  // set the type info based on the literal string
95  ti.set_scale(static_cast<int>(after_dot.length()));
96  ti.set_dimension(static_cast<int>(before_dot_digits + ti.get_scale()));
97  ti.set_notnull(false);
98  } else {
99  CHECK_GE(ti.get_scale(), 0);
100  if (before_dot_digits + ti.get_scale() > static_cast<size_t>(ti.get_dimension())) {
101  throw std::runtime_error("numeric value " + std::string(s) +
102  " exceeds the maximum precision of " +
103  std::to_string(ti.get_dimension()));
104  }
105  for (size_t i = static_cast<size_t>(ti.get_scale()); i < after_dot.length(); ++i) {
106  fraction /= 10; // truncate the digits after decimal point.
107  }
108  }
109  // the following loop can be made more efficient if needed
110  for (int i = 0; i < ti.get_scale(); i++) {
111  result *= 10;
112  }
113  if (result < 0) {
114  result -= fraction;
115  } else {
116  result += fraction;
117  }
118  return result * sign;
119 }
#define CHECK_GE(x, y)
Definition: Logger.h:210
HOST DEVICE int get_scale() const
Definition: sqltypes.h:264
std::string to_string(char const *&&v)
void set_scale(int s)
Definition: sqltypes.h:354
void set_dimension(int d)
Definition: sqltypes.h:351
HOST DEVICE int get_dimension() const
Definition: sqltypes.h:261
void set_notnull(bool n)
Definition: sqltypes.h:356
+ Here is the call graph for this function:
+ Here is the caller graph for this function:

◆ StringToDatum()

Datum StringToDatum ( std::string_view  s,
SQLTypeInfo &ti 
)

Definition at line 124 of file Datum.cpp.

References Datum::bigintval, Datum::boolval, Datum::doubleval, Datum::floatval, SQLTypeInfo::get_dimension(), SQLTypeInfo::get_type(), SQLTypeInfo::get_type_name(), Datum::intval, kARRAY, kBIGINT, kBOOLEAN, kCOLUMN, kDATE, kDECIMAL, kDOUBLE, kFLOAT, kINT, kLINESTRING, kMULTIPOLYGON, kNUMERIC, kPOINT, kPOLYGON, kSMALLINT, kTIME, kTIMESTAMP, kTINYINT, parse_numeric(), Datum::smallintval, Datum::tinyintval, and to_upper().

Referenced by import_export::TypedImportBuffer::add_value(), Parser::FixedPtLiteral::analyze(), Analyzer::Constant::cast_from_string(), SQLTypeInfo::get_storage_size(), anonymous_namespace{ArrowImporter.h}::ArrowValue< std::string >::operator const bool(), anonymous_namespace{ArrowImporter.h}::ArrowValue< std::string >::operator const DATA_TYPE(), populate_TColumn(), and import_export::StringToArray().

124  {
125  Datum d;
126  try {
127  switch (ti.get_type()) {
128  case kARRAY:
129  case kCOLUMN:
130  break;
131  case kBOOLEAN:
132  if (s == "t" || s == "T" || s == "1" || to_upper(std::string(s)) == "TRUE") {
133  d.boolval = true;
134  } else if (s == "f" || s == "F" || s == "0" ||
135  to_upper(std::string(s)) == "FALSE") {
136  d.boolval = false;
137  } else {
138  throw std::runtime_error("Invalid string for boolean " + std::string(s));
139  }
140  break;
141  case kNUMERIC:
142  case kDECIMAL:
143  d.bigintval = parse_numeric(s, ti);
144  break;
145  case kBIGINT:
146  d.bigintval = std::stoll(std::string(s));
147  break;
148  case kINT:
149  d.intval = std::stoi(std::string(s));
150  break;
151  case kSMALLINT:
152  d.smallintval = std::stoi(std::string(s));
153  break;
154  case kTINYINT:
155  d.tinyintval = std::stoi(std::string(s));
156  break;
157  case kFLOAT:
158  d.floatval = std::stof(std::string(s));
159  break;
160  case kDOUBLE:
161  d.doubleval = std::stod(std::string(s));
162  break;
163  case kTIME:
164  d.bigintval = DateTimeStringValidate<kTIME>()(std::string(s), ti.get_dimension());
165  break;
166  case kTIMESTAMP:
167  d.bigintval =
168  DateTimeStringValidate<kTIMESTAMP>()(std::string(s), ti.get_dimension());
169  break;
170  case kDATE:
171  d.bigintval = DateTimeStringValidate<kDATE>()(std::string(s), ti.get_dimension());
172  break;
173  case kPOINT:
174  case kLINESTRING:
175  case kPOLYGON:
176  case kMULTIPOLYGON:
177  throw std::runtime_error("Internal error: geometry type in StringToDatum.");
178  default:
179  throw std::runtime_error("Internal error: invalid type in StringToDatum.");
180  }
181  } catch (const std::invalid_argument&) {
182  throw std::runtime_error("Invalid conversion from string to " + ti.get_type_name());
183  } catch (const std::out_of_range&) {
184  throw std::runtime_error("Got out of range error during conversion from string to " +
185  ti.get_type_name());
186  }
187  return d;
188 }
int8_t tinyintval
Definition: sqltypes.h:135
Definition: sqltypes.h:51
int64_t parse_numeric(const std::string_view s, SQLTypeInfo &ti)
Definition: Datum.cpp:71
bool boolval
Definition: sqltypes.h:134
int32_t intval
Definition: sqltypes.h:137
float floatval
Definition: sqltypes.h:139
int64_t bigintval
Definition: sqltypes.h:138
int16_t smallintval
Definition: sqltypes.h:136
std::string to_upper(const std::string &str)
Definition: sqltypes.h:55
std::string get_type_name() const
Definition: sqltypes.h:362
HOST DEVICE int get_dimension() const
Definition: sqltypes.h:261
HOST DEVICE SQLTypes get_type() const
Definition: sqltypes.h:259
Definition: sqltypes.h:47
double doubleval
Definition: sqltypes.h:140
+ Here is the call graph for this function:
+ Here is the caller graph for this function: