OmniSciDB
a5dc49c757
|
#include <filesystem>
#include <mutex>
#include <shared_mutex>
#include <string>
#include <tuple>
#include <unordered_map>
#include <vector>
#include "QueryEngine/heavydbTypes.h"
Go to the source code of this file.
Classes | |
struct | ZStdNormalizationSummaryStats< T > |
Namespaces | |
FileUtilities | |
Enumerations | |
enum | BoundsType { Min, Max } |
enum | IntervalType { Inclusive, Exclusive } |
Functions | |
template<typename T > | |
std::pair< T, T > | get_column_min_max (Column< T > const &) |
std::pair< int32_t, int32_t > | get_column_min_max (Column< TextEncodingDict > const &) |
template<typename T > | |
NEVER_INLINE HOST double | get_column_mean (const T *data, const int64_t num_rows) |
template<typename T > | |
NEVER_INLINE HOST double | get_column_mean (const Column< T > &col) |
template<typename T > | |
NEVER_INLINE HOST double | get_column_std_dev (const Column< T > &col, const double mean) |
template<typename T > | |
NEVER_INLINE HOST double | get_column_std_dev (const T *data, const int64_t num_rows, const double mean) |
template<typename T > | |
void | z_std_normalize_col (const T *input_data, T *output_data, const int64_t num_rows, const double mean, const double std_dev) |
template<typename T > | |
std::vector< std::vector< T > > | z_std_normalize_data (const std::vector< T * > &input_data, const int64_t num_rows) |
template<typename T > | |
ZStdNormalizationSummaryStats< T > | z_std_normalize_data_with_summary_stats (const std::vector< T * > &input_data, const int64_t num_rows) |
template<typename T > | |
NEVER_INLINE HOST std::tuple < T, T, bool > | get_column_metadata (const Column< T > &col) |
NEVER_INLINE HOST std::tuple < int32_t, int32_t, bool > | get_column_metadata (const Column< TextEncodingDict > &col) |
template<typename T1 , typename T2 > | |
NEVER_INLINE HOST T1 | distance_in_meters (const T1 fromlon, const T1 fromlat, const T2 tolon, const T2 tolat) |
int64_t | x_y_bin_to_bin_index (const int64_t x_bin, const int64_t y_bin, const int64_t num_x_bins) |
std::pair< int64_t, int64_t > | bin_to_x_y_bin_indexes (const int64_t bin, const int64_t num_x_bins) |
std::vector < std::filesystem::path > | FileUtilities::get_fs_paths (const std::string &file_or_directory) |
template<typename T > | |
NEVER_INLINE HOST bool | is_valid_tf_input (const T input, const T bounds_val, const BoundsType bounds_type, const IntervalType interval_type) |
enum BoundsType |
Enumerator | |
---|---|
Min | |
Max |
Definition at line 121 of file TableFunctionsCommon.hpp.
enum IntervalType |
Enumerator | |
---|---|
Inclusive | |
Exclusive |
Definition at line 123 of file TableFunctionsCommon.hpp.
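std::pair<int64_t, int64_t> bin_to_x_y_bin_indexes | ( | const int64_t | bin, |
const int64_t | num_x_bins | ||
) |
inline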
Definition at line 112 of file TableFunctionsCommon.hpp.
Referenced by GeoRaster< T, Z >::get_xy_coords_for_bin_idx().
NEVER_INLINE HOST T1 distance_in_meters | ( | const T1 | fromlon, |
const T1 | fromlat, | ||
const T2 | tolon, | ||
const T2 | tolat | ||
) |
Definition at line 452 of file TableFunctionsCommon.cpp.
NEVER_INLINE HOST double get_column_mean | ( | const T * | data, |
const int64_t | num_rows | ||
) |
Definition at line 116 of file TableFunctionsCommon.cpp.
References max_inputs_per_thread, threading_serial::parallel_for(), and heavydb.dtypes::T.
Referenced by get_column_mean(), r2_score_impl(), z_std_normalize_data(), and z_std_normalize_data_with_summary_stats().
NEVER_INLINE HOST double get_column_mean | ( | const Column< T > & | col | ) |
Definition at line 183 of file TableFunctionsCommon.cpp.
References get_column_mean(), Column< T >::getPtr(), and Column< T >::size().
NEVER_INLINE HOST std::tuple<T, T, bool> get_column_metadata | ( | const Column< T > & | col | ) |
Definition at line 276 of file TableFunctionsCommon.cpp.
References Column< T >::isNull(), max_inputs_per_thread, threading_serial::parallel_for(), Column< T >::size(), and heavydb.dtypes::T.
Referenced by get_column_metadata().
NEVER_INLINE HOST std::tuple<int32_t, int32_t, bool> get_column_metadata | ( | const Column< TextEncodingDict > & | col | ) |
Definition at line 358 of file TableFunctionsCommon.cpp.
References get_column_metadata(), Column< TextEncodingDict >::getPtr(), and Column< TextEncodingDict >::size().
std::pair<T, T> get_column_min_max | ( | Column< T > const & | ) |
Definition at line 42 of file TableFunctionsCommon.hpp.
std::pair<int32_t, int32_t> get_column_min_max | ( | Column< TextEncodingDict > const & | ) |
Definition at line 46 of file TableFunctionsCommon.hpp.
NEVER_INLINE HOST double get_column_std_dev | ( | const Column< T > & | col, |
const double | mean | ||
) |
Definition at line 195 of file TableFunctionsCommon.cpp.
References get_column_std_dev(), Column< T >::getPtr(), and Column< T >::size().
Referenced by get_column_std_dev(), z_std_normalize_data(), and z_std_normalize_data_with_summary_stats().
NEVER_INLINE HOST double get_column_std_dev | ( | const T * | data, |
const int64_t | num_rows, | ||
const double | mean | ||
) |
Definition at line 209 of file TableFunctionsCommon.cpp.
References max_inputs_per_thread, threading_serial::parallel_for(), and heavydb.dtypes::T.
NEVER_INLINE HOST bool is_valid_tf_input | ( | const T | input, |
const T | bounds_val, | ||
const BoundsType | bounds_type, | ||
const IntervalType | interval_type | ||
) |
Definition at line 556 of file TableFunctionsCommon.cpp.
References Exclusive, Inclusive, Max, Min, and UNREACHABLE.
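int64_t x_y_bin_to_bin_index | ( | const int64_t | x_bin, |
const int64_t | y_bin, | ||
const int64_t | num_x_bins | ||
) |
inline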
Definition at line 106 of file TableFunctionsCommon.hpp.
Referenced by GeoRaster< T, Z >::calculate_slope_and_aspect(), GeoRaster< T, Z >::computeParallelImpl(), GeoRaster< T, Z >::computeSerialImpl(), GeoRaster< T, Z >::fill_bin_from_avg_box_neighborhood(), GeoRaster< T, Z >::fill_bin_from_box_neighborhood(), GeoRaster< T, Z >::fill_bins_from_box_neighborhood(), GeoRaster< T, Z >::fill_bins_from_gaussian_neighborhood(), GeoRaster< T, Z >::get_bin_idx_and_z_val_for_xy_bin(), GeoRaster< T, Z >::get_bin_idx_for_xy_coords(), GeoRaster< T, Z >::get_nxn_neighbors_if_not_null(), GeoRaster< T, Z >::offset_source_z_from_raster_z(), GeoRaster< T, Z >::outputDenseColumn(), GeoRaster< T, Z >::outputDenseColumns(), and GeoRaster< T, Z >::outputDenseColumnsAndFill().
void z_std_normalize_col | ( | const T * | input_data, |
T * | output_data, | ||
const int64_t | num_rows, | ||
const double | mean, | ||
const double | std_dev | ||
) |
Definition at line 365 of file TableFunctionsCommon.cpp.
References threading_serial::parallel_for().
Referenced by z_std_normalize_data(), and z_std_normalize_data_with_summary_stats().
std::vector<std::vector<T> > z_std_normalize_data | ( | const std::vector< T * > & | input_data, |
const int64_t | num_rows | ||
) |
Definition at line 397 of file TableFunctionsCommon.cpp.
References get_column_mean(), get_column_std_dev(), and z_std_normalize_col().
Referenced by dbscan__cpu_template(), and kmeans__cpu_template().
ZStdNormalizationSummaryStats<T> z_std_normalize_data_with_summary_stats | ( | const std::vector< T * > & | input_data, |
const int64_t | num_rows | ||
) |
Definition at line 422 of file TableFunctionsCommon.cpp.
References get_column_mean(), get_column_std_dev(), and z_std_normalize_col().
Referenced by pca_fit_impl().