| 1 | #include "duckdb/main/config.hpp" | 
|---|
| 2 | #include "duckdb/function/compression_function.hpp" | 
|---|
| 3 | #include "duckdb/function/compression/compression.hpp" | 
|---|
| 4 | #include "duckdb/common/pair.hpp" | 
|---|
| 5 |  | 
|---|
| 6 | namespace duckdb { | 
|---|
| 7 |  | 
|---|
| 8 | typedef CompressionFunction (*get_compression_function_t)(PhysicalType type); | 
|---|
| 9 | typedef bool (*compression_supports_type_t)(PhysicalType type); | 
|---|
| 10 |  | 
|---|
| 11 | struct DefaultCompressionMethod { | 
|---|
| 12 | CompressionType type; | 
|---|
| 13 | get_compression_function_t get_function; | 
|---|
| 14 | compression_supports_type_t supports_type; | 
|---|
| 15 | }; | 
|---|
| 16 |  | 
|---|
| 17 | static DefaultCompressionMethod internal_compression_methods[] = { | 
|---|
| 18 | {.type: CompressionType::COMPRESSION_CONSTANT, .get_function: ConstantFun::GetFunction, .supports_type: ConstantFun::TypeIsSupported}, | 
|---|
| 19 | {.type: CompressionType::COMPRESSION_UNCOMPRESSED, .get_function: UncompressedFun::GetFunction, .supports_type: UncompressedFun::TypeIsSupported}, | 
|---|
| 20 | {.type: CompressionType::COMPRESSION_RLE, .get_function: RLEFun::GetFunction, .supports_type: RLEFun::TypeIsSupported}, | 
|---|
| 21 | {.type: CompressionType::COMPRESSION_BITPACKING, .get_function: BitpackingFun::GetFunction, .supports_type: BitpackingFun::TypeIsSupported}, | 
|---|
| 22 | {.type: CompressionType::COMPRESSION_DICTIONARY, .get_function: DictionaryCompressionFun::GetFunction, | 
|---|
| 23 | .supports_type: DictionaryCompressionFun::TypeIsSupported}, | 
|---|
| 24 | {.type: CompressionType::COMPRESSION_CHIMP, .get_function: ChimpCompressionFun::GetFunction, .supports_type: ChimpCompressionFun::TypeIsSupported}, | 
|---|
| 25 | {.type: CompressionType::COMPRESSION_PATAS, .get_function: PatasCompressionFun::GetFunction, .supports_type: PatasCompressionFun::TypeIsSupported}, | 
|---|
| 26 | {.type: CompressionType::COMPRESSION_FSST, .get_function: FSSTFun::GetFunction, .supports_type: FSSTFun::TypeIsSupported}, | 
|---|
| 27 | {.type: CompressionType::COMPRESSION_AUTO, .get_function: nullptr, .supports_type: nullptr}}; | 
|---|
| 28 |  | 
|---|
| 29 | static optional_ptr<CompressionFunction> FindCompressionFunction(CompressionFunctionSet &set, CompressionType type, | 
|---|
| 30 | PhysicalType data_type) { | 
|---|
| 31 | auto &functions = set.functions; | 
|---|
| 32 | auto comp_entry = functions.find(x: type); | 
|---|
| 33 | if (comp_entry != functions.end()) { | 
|---|
| 34 | auto &type_functions = comp_entry->second; | 
|---|
| 35 | auto type_entry = type_functions.find(x: data_type); | 
|---|
| 36 | if (type_entry != type_functions.end()) { | 
|---|
| 37 | return &type_entry->second; | 
|---|
| 38 | } | 
|---|
| 39 | } | 
|---|
| 40 | return nullptr; | 
|---|
| 41 | } | 
|---|
| 42 |  | 
|---|
| 43 | static optional_ptr<CompressionFunction> LoadCompressionFunction(CompressionFunctionSet &set, CompressionType type, | 
|---|
| 44 | PhysicalType data_type) { | 
|---|
| 45 | for (idx_t index = 0; internal_compression_methods[index].get_function; index++) { | 
|---|
| 46 | const auto &method = internal_compression_methods[index]; | 
|---|
| 47 | if (method.type == type) { | 
|---|
| 48 | // found the correct compression type | 
|---|
| 49 | if (!method.supports_type(data_type)) { | 
|---|
| 50 | // but it does not support this data type: bail out | 
|---|
| 51 | return nullptr; | 
|---|
| 52 | } | 
|---|
| 53 | // the type is supported: create the function and insert it into the set | 
|---|
| 54 | auto function = method.get_function(data_type); | 
|---|
| 55 | set.functions[type].insert(x: make_pair(x&: data_type, y&: function)); | 
|---|
| 56 | return FindCompressionFunction(set, type, data_type); | 
|---|
| 57 | } | 
|---|
| 58 | } | 
|---|
| 59 | throw InternalException( "Unsupported compression function type"); | 
|---|
| 60 | } | 
|---|
| 61 |  | 
|---|
| 62 | static void TryLoadCompression(DBConfig &config, vector<reference<CompressionFunction>> &result, CompressionType type, | 
|---|
| 63 | PhysicalType data_type) { | 
|---|
| 64 | auto function = config.GetCompressionFunction(type, data_type); | 
|---|
| 65 | if (!function) { | 
|---|
| 66 | return; | 
|---|
| 67 | } | 
|---|
| 68 | result.push_back(x: *function); | 
|---|
| 69 | } | 
|---|
| 70 |  | 
|---|
| 71 | vector<reference<CompressionFunction>> DBConfig::GetCompressionFunctions(PhysicalType data_type) { | 
|---|
| 72 | vector<reference<CompressionFunction>> result; | 
|---|
| 73 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_UNCOMPRESSED, data_type); | 
|---|
| 74 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_RLE, data_type); | 
|---|
| 75 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_BITPACKING, data_type); | 
|---|
| 76 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_DICTIONARY, data_type); | 
|---|
| 77 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_CHIMP, data_type); | 
|---|
| 78 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_PATAS, data_type); | 
|---|
| 79 | TryLoadCompression(config&: *this, result, type: CompressionType::COMPRESSION_FSST, data_type); | 
|---|
| 80 | return result; | 
|---|
| 81 | } | 
|---|
| 82 |  | 
|---|
| 83 | optional_ptr<CompressionFunction> DBConfig::GetCompressionFunction(CompressionType type, PhysicalType data_type) { | 
|---|
| 84 | lock_guard<mutex> l(compression_functions->lock); | 
|---|
| 85 | // check if the function is already loaded | 
|---|
| 86 | auto function = FindCompressionFunction(set&: *compression_functions, type, data_type); | 
|---|
| 87 | if (function) { | 
|---|
| 88 | return function; | 
|---|
| 89 | } | 
|---|
| 90 | // else load the function | 
|---|
| 91 | return LoadCompressionFunction(set&: *compression_functions, type, data_type); | 
|---|
| 92 | } | 
|---|
| 93 |  | 
|---|
| 94 | } // namespace duckdb | 
|---|
| 95 |  | 
|---|