#include "parquet_timestamp.hpp" #include "duckdb.hpp" #include "duckdb/common/types/date.hpp" #include "duckdb/common/types/time.hpp" #include "duckdb/common/types/timestamp.hpp" namespace duckdb { // surely they are joking static constexpr int64_t JULIAN_TO_UNIX_EPOCH_DAYS = 2440588LL; static constexpr int64_t MILLISECONDS_PER_DAY = 86400000LL; static constexpr int64_t MICROSECONDS_PER_DAY = MILLISECONDS_PER_DAY * 1000LL; static constexpr int64_t NANOSECONDS_PER_MICRO = 1000LL; static constexpr int64_t NANOSECONDS_PER_DAY = MICROSECONDS_PER_DAY * 1000LL; static inline int64_t ImpalaTimestampToDays(const Int96 &impala_timestamp) { return impala_timestamp.value[2] - JULIAN_TO_UNIX_EPOCH_DAYS; } static int64_t ImpalaTimestampToMicroseconds(const Int96 &impala_timestamp) { int64_t days_since_epoch = ImpalaTimestampToDays(impala_timestamp); auto nanoseconds = Load(const_data_ptr_cast(impala_timestamp.value)); auto microseconds = nanoseconds / NANOSECONDS_PER_MICRO; return days_since_epoch * MICROSECONDS_PER_DAY + microseconds; } static int64_t ImpalaTimestampToNanoseconds(const Int96 &impala_timestamp) { int64_t days_since_epoch = ImpalaTimestampToDays(impala_timestamp); auto nanoseconds = Load(const_data_ptr_cast(impala_timestamp.value)); return days_since_epoch * NANOSECONDS_PER_DAY + nanoseconds; } timestamp_ns_t ImpalaTimestampToTimestampNS(const Int96 &raw_ts) { timestamp_ns_t result; result.value = ImpalaTimestampToNanoseconds(raw_ts); return result; } timestamp_t ImpalaTimestampToTimestamp(const Int96 &raw_ts) { auto impala_us = ImpalaTimestampToMicroseconds(raw_ts); return Timestamp::FromEpochMicroSeconds(impala_us); } Int96 TimestampToImpalaTimestamp(timestamp_t &ts) { int32_t hour, min, sec, msec; Time::Convert(Timestamp::GetTime(ts), hour, min, sec, msec); uint64_t ms_since_midnight = hour * 60 * 60 * 1000 + min * 60 * 1000 + sec * 1000 + msec; auto days_since_epoch = Date::Epoch(Timestamp::GetDate(ts)) / int64_t(24 * 60 * 60); // first two uint32 in Int96 are nanoseconds since midnights // last uint32 is number of days since year 4713 BC ("Julian date") Int96 impala_ts; Store(ms_since_midnight * 1000000, data_ptr_cast(impala_ts.value)); impala_ts.value[2] = days_since_epoch + JULIAN_TO_UNIX_EPOCH_DAYS; return impala_ts; } timestamp_t ParquetTimestampMicrosToTimestamp(const int64_t &raw_ts) { return Timestamp::FromEpochMicroSeconds(raw_ts); } timestamp_t ParquetTimestampMsToTimestamp(const int64_t &raw_ts) { timestamp_t input(raw_ts); if (!Timestamp::IsFinite(input)) { return input; } return Timestamp::FromEpochMs(raw_ts); } timestamp_ns_t ParquetTimestampMsToTimestampNs(const int64_t &raw_ms) { timestamp_ns_t input; input.value = raw_ms; if (!Timestamp::IsFinite(input)) { return input; } return Timestamp::TimestampNsFromEpochMillis(raw_ms); } timestamp_ns_t ParquetTimestampUsToTimestampNs(const int64_t &raw_us) { timestamp_ns_t input; input.value = raw_us; if (!Timestamp::IsFinite(input)) { return input; } return Timestamp::TimestampNsFromEpochMicros(raw_us); } timestamp_ns_t ParquetTimestampNsToTimestampNs(const int64_t &raw_ns) { timestamp_ns_t result; result.value = raw_ns; return result; } timestamp_t ParquetTimestampNsToTimestamp(const int64_t &raw_ts) { timestamp_t input(raw_ts); if (!Timestamp::IsFinite(input)) { return input; } return Timestamp::FromEpochNanoSeconds(raw_ts); } date_t ParquetIntToDate(const int32_t &raw_date) { return date_t(raw_date); } template static T ParquetWrapTime(const T &raw, const T day) { // Special case 24:00:00 if (raw == day) { return raw; } const auto modulus = raw % day; return modulus + (modulus < 0) * day; } dtime_t ParquetMsIntToTime(const int32_t &raw_millis) { return Time::FromTimeMs(raw_millis); } dtime_t ParquetIntToTime(const int64_t &raw_micros) { return dtime_t(raw_micros); } dtime_t ParquetNsIntToTime(const int64_t &raw_nanos) { return Time::FromTimeNs(raw_nanos); } dtime_ns_t ParquetMsIntToTimeNs(const int32_t &raw_millis) { return dtime_ns_t(Interval::NANOS_PER_MSEC * raw_millis); } dtime_ns_t ParquetUsIntToTimeNs(const int64_t &raw_micros) { return dtime_ns_t(raw_micros * Interval::NANOS_PER_MICRO); } dtime_ns_t ParquetIntToTimeNs(const int64_t &raw_nanos) { return dtime_ns_t(raw_nanos); } dtime_tz_t ParquetIntToTimeMsTZ(const int32_t &raw_millis) { const int32_t MSECS_PER_DAY = Interval::MSECS_PER_SEC * Interval::SECS_PER_DAY; const auto millis = ParquetWrapTime(raw_millis, MSECS_PER_DAY); return dtime_tz_t(Time::FromTimeMs(millis), 0); } dtime_tz_t ParquetIntToTimeTZ(const int64_t &raw_micros) { const auto micros = ParquetWrapTime(raw_micros, Interval::MICROS_PER_DAY); return dtime_tz_t(dtime_t(micros), 0); } dtime_tz_t ParquetIntToTimeNsTZ(const int64_t &raw_nanos) { const auto nanos = ParquetWrapTime(raw_nanos, Interval::NANOS_PER_DAY); return dtime_tz_t(Time::FromTimeNs(nanos), 0); } } // namespace duckdb