// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #pragma once #include #include #include #include "arrow/util/concurrent_map.h" #include "parquet/encryption/file_key_material_store.h" #include "parquet/encryption/key_encryption_key.h" #include "parquet/encryption/key_toolkit.h" #include "parquet/encryption/kms_client.h" #include "parquet/platform.h" namespace parquet::encryption { // This class will generate "key metadata" from "data encryption key" and "master key", // following these steps: // 1. Wrap "data encryption key". There are 2 modes: // 1.1. single wrapping: encrypt "data encryption key" directly with "master encryption // key" // 1.2. double wrapping: 2 steps: // 1.2.1. "key encryption key" is randomized (see KeyEncryptionKey class) // 1.2.2. "data encryption key" is encrypted with the above "key encryption key" // 2. Create "key material" (see structure in KeyMaterial class) // 3. Create "key metadata" with "key material" inside or a reference to outside "key // material" (see structure in KeyMetadata class). class PARQUET_EXPORT FileKeyWrapper { public: static constexpr int kKeyEncryptionKeyLength = 16; static constexpr int kKeyEncryptionKeyIdLength = 16; /// key_toolkit and kms_connection_config is to get KmsClient from the cache or create /// KmsClient if it's not in the cache yet. cache_entry_lifetime_seconds is life time of /// KmsClient in the cache. key_material_store is to store "key material" outside /// parquet file, NULL if "key material" is stored inside parquet file. FileKeyWrapper(KeyToolkit* key_toolkit, const KmsConnectionConfig& kms_connection_config, std::shared_ptr key_material_store, double cache_entry_lifetime_seconds, bool double_wrapping); /// Creates key_metadata field for a given data key, via wrapping the key with the /// master key. /// When external key material is used, an identifier is usually generated automatically /// but may be specified explicitly to support key rotation, /// which requires keeping the same identifiers. std::string GetEncryptionKeyMetadata(const std::string& data_key, const std::string& master_key_id, bool is_footer_key, std::string key_id_in_file = ""); private: KeyEncryptionKey CreateKeyEncryptionKey(const std::string& master_key_id); /// A map of Master Encryption Key ID -> KeyEncryptionKey, for the current token std::shared_ptr<::arrow::util::ConcurrentMap> kek_per_master_key_id_; std::shared_ptr kms_client_; KmsConnectionConfig kms_connection_config_; std::shared_ptr key_material_store_; const double cache_entry_lifetime_seconds_; const bool double_wrapping_; uint16_t key_counter_; }; } // namespace parquet::encryption