| 1 | #include "duckdb/main/config.hpp" |
| 2 | #include "duckdb/function/compression_function.hpp" |
| 3 | #include "duckdb/function/compression/compression.hpp" |
| 4 | #include "duckdb/common/pair.hpp" |
| 5 | |
| 6 | namespace duckdb { |
| 7 | |
| 8 | typedef CompressionFunction (*get_compression_function_t)(PhysicalType type); |
| 9 | typedef bool (*compression_supports_type_t)(PhysicalType type); |
| 10 | |
| 11 | struct DefaultCompressionMethod { |
| 12 | CompressionType type; |
| 13 | get_compression_function_t get_function; |
| 14 | compression_supports_type_t supports_type; |
| 15 | }; |
| 16 | |
| 17 | static DefaultCompressionMethod internal_compression_methods[] = { |
| 18 | {.type: CompressionType::COMPRESSION_CONSTANT, .get_function: ConstantFun::GetFunction, .supports_type: ConstantFun::TypeIsSupported}, |
| 19 | {.type: CompressionType::COMPRESSION_UNCOMPRESSED, .get_function: UncompressedFun::GetFunction, .supports_type: UncompressedFun::TypeIsSupported}, |
| 20 | {.type: CompressionType::COMPRESSION_RLE, .get_function: RLEFun::GetFunction, .supports_type: RLEFun::TypeIsSupported}, |
| 21 | {.type: CompressionType::COMPRESSION_BITPACKING, .get_function: BitpackingFun::GetFunction, .supports_type: BitpackingFun::TypeIsSupported}, |
| 22 | {.type: CompressionType::COMPRESSION_DICTIONARY, .get_function: DictionaryCompressionFun::GetFunction, |
| 23 | .supports_type: DictionaryCompressionFun::TypeIsSupported}, |
| 24 | {.type: CompressionType::COMPRESSION_CHIMP, .get_function: ChimpCompressionFun::GetFunction, .supports_type: ChimpCompressionFun::TypeIsSupported}, |
| 25 | {.type: CompressionType::COMPRESSION_PATAS, .get_function: PatasCompressionFun::GetFunction, .supports_type: PatasCompressionFun::TypeIsSupported}, |
| 26 | {.type: CompressionType::COMPRESSION_FSST, .get_function: FSSTFun::GetFunction, .supports_type: FSSTFun::TypeIsSupported}, |
| 27 | {.type: CompressionType::COMPRESSION_AUTO, .get_function: nullptr, .supports_type: nullptr}}; |
| 28 | |
| 29 | static optional_ptr<CompressionFunction> FindCompressionFunction(CompressionFunctionSet &set, CompressionType type, |
| 30 | PhysicalType data_type) { |
| 31 | auto &functions = set.functions; |
| 32 | auto comp_entry = functions.find(x: type); |
| 33 | if (comp_entry != functions.end()) { |
| 34 | auto &type_functions = comp_entry->second; |
| 35 | auto type_entry = type_functions.find(x: data_type); |
| 36 | if (type_entry != type_functions.end()) { |
| 37 | return &type_entry->second; |
| 38 | } |
| 39 | } |
| 40 | return nullptr; |
| 41 | } |
| 42 | |
| 43 | static optional_ptr<CompressionFunction> LoadCompressionFunction(CompressionFunctionSet &set, CompressionType type, |
| 44 | PhysicalType data_type) { |
| 45 | for (idx_t index = 0; internal_compression_methods[index].get_function; index++) { |
| 46 | const auto &method = internal_compression_methods[index]; |
| 47 | if (method.type == type) { |
| 48 | // found the correct compression type |
| 49 | if (!method.supports_type(data_type)) { |
| 50 | // but it does not support this data type: bail out |
| 51 | return nullptr; |
| 52 | } |
| 53 | // the type is supported: create the function and insert it into the set |
| 54 | auto function = method.get_function(data_type); |
| 55 | set.functions[type].insert(x: make_pair(x&: data_type, y&: function)); |
| 56 | return FindCompressionFunction(set, type, data_type); |
| 57 | } |
| 58 | } |
| 59 | throw InternalException("Unsupported compression function type" ); |
| 60 | } |
| 61 | |
| 62 | static void TryLoadCompression(DBConfig &config, vector<reference<CompressionFunction>> &result, CompressionType type, |
| 63 | PhysicalType data_type) { |
| 64 | auto function = config.GetCompressionFunction(type, data_type); |
| 65 | if (!function) { |
| 66 | return; |
| 67 | } |
| 68 | result.push_back(x: *function); |
| 69 | } |
| 70 | |
| 71 | vector<reference<CompressionFunction>> DBConfig::GetCompressionFunctions(PhysicalType data_type) { |
| 72 | vector<reference<CompressionFunction>> result; |
| 73 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_UNCOMPRESSED, data_type); |
| 74 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_RLE, data_type); |
| 75 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_BITPACKING, data_type); |
| 76 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_DICTIONARY, data_type); |
| 77 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_CHIMP, data_type); |
| 78 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_PATAS, data_type); |
| 79 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_FSST, data_type); |
| 80 | return result; |
| 81 | } |
| 82 | |
| 83 | optional_ptr<CompressionFunction> DBConfig::GetCompressionFunction(CompressionType type, PhysicalType data_type) { |
| 84 | lock_guard<mutex> l(compression_functions->lock); |
| 85 | // check if the function is already loaded |
| 86 | auto function = FindCompressionFunction(set&: *compression_functions, type, data_type); |
| 87 | if (function) { |
| 88 | return function; |
| 89 | } |
| 90 | // else load the function |
| 91 | return LoadCompressionFunction(set&: *compression_functions, type, data_type); |
| 92 | } |
| 93 | |
| 94 | } // namespace duckdb |
| 95 | |