rgw: simplify GCM key cache, IV layout, and endian encoding

author Matthew N. Heler <matthew.heler@hotmail.com>

Wed, 8 Apr 2026 11:42:53 +0000 (06:42 -0500)

committer Matthew N. Heler <matthew.heler@hotmail.com>

Wed, 20 May 2026 18:31:02 +0000 (13:31 -0500)
author Matthew N. Heler <matthew.heler@hotmail.com>
Wed, 8 Apr 2026 11:42:53 +0000 (06:42 -0500)
committer Matthew N. Heler <matthew.heler@hotmail.com>
Wed, 20 May 2026 18:31:02 +0000 (13:31 -0500)
diff --git a/src/crypto/isa-l/isal_crypto_accel.cc b/src/crypto/isa-l/isal_crypto_accel.cc

index 9efeb91e93f5b586a5af11cf86c36638d45ca440..7704996481281b4b0cfb673a2b389fae2215fbf9 100644 (file)
--- a/src/crypto/isa-l/isal_crypto_accel.cc
+++ b/src/crypto/isa-l/isal_crypto_accel.cc
@@ -48,38 +48,33 @@ bool ISALCryptoAccel::cbc_decrypt(unsigned char* out, const unsigned char* in, s
    return true;
  }
  
-/**
+/*
   * Thread-local GCM key cache to avoid re-running aes_gcm_pre_256() for
- * repeated keys. Key material is securely wiped on key change and thread exit.
+ * repeated keys. Key material is securely wiped on thread exit.
   */
+struct gcm_key_cache_t {
+  unsigned char last_key[CryptoAccel::AES_256_KEYSIZE];  // raw key bytes that cached_gkey was expanded from
+  alignas(16) gcm_key_data cached_gkey;                  // output of aes_gcm_pre_256() for last_key
+
+  ~gcm_key_cache_t() {  // scrub the raw key and its expansion before the storage is released
+    ceph_memzero_s(last_key, sizeof(last_key), sizeof(last_key));
+    ceph_memzero_s(&cached_gkey, sizeof(cached_gkey), sizeof(cached_gkey));
+  }
+};
+
  static inline const gcm_key_data* get_cached_gcm_key(const unsigned char* key)
  {
-  struct gcm_key_cache_t {
-    bool valid = false;
-    unsigned char last_key[CryptoAccel::AES_256_KEYSIZE];
-    alignas(16) gcm_key_data cached_gkey;
-
-    void purge() {
-      if (valid) {
-        ceph_memzero_s(last_key, sizeof(last_key), sizeof(last_key));
-        ceph_memzero_s(&cached_gkey, sizeof(cached_gkey), sizeof(cached_gkey));
-        valid = false;
-      }
-    }
-
-    ~gcm_key_cache_t() { purge(); }
-  };
-
-  static thread_local gcm_key_cache_t cache;
-
-  if (!cache.valid || memcmp(cache.last_key, key, CryptoAccel::AES_256_KEYSIZE) != 0) {
-    cache.purge();
-    aes_gcm_pre_256(key, &cache.cached_gkey);
-    memcpy(cache.last_key, key, CryptoAccel::AES_256_KEYSIZE);
-    cache.valid = true;
+  static thread_local std::unique_ptr<gcm_key_cache_t> cache;
+
+  if (!cache)
+    cache = std::make_unique<gcm_key_cache_t>();
+
+  if (memcmp(cache->last_key, key, CryptoAccel::AES_256_KEYSIZE) != 0) {
+    aes_gcm_pre_256(key, &cache->cached_gkey);
+    memcpy(cache->last_key, key, CryptoAccel::AES_256_KEYSIZE);
    }
  
-  return &cache.cached_gkey;
+  return &cache->cached_gkey;
  }
  
  bool ISALCryptoAccel::gcm_encrypt(unsigned char* out, const unsigned char* in, size_t size,
diff --git a/src/rgw/rgw_crypt.cc b/src/rgw/rgw_crypt.cc

index 4fb2eef0d69979b479b8a5caa84eda25126bee11..f671e3ddd88a4a6392540c484ffd2723b80701c2 100644 (file)
--- a/src/rgw/rgw_crypt.cc
+++ b/src/rgw/rgw_crypt.cc
@@ -664,14 +664,6 @@ public:
    static const size_t CHUNK_SIZE = 4096;
    static const size_t ENCRYPTED_CHUNK_SIZE = CHUNK_SIZE + GCM_TAG_SIZE; // 4112
  
-  /**
-   * Combined index layout for IV derivation:
-   *   - Upper 24 bits: part_number (supports up to 16M parts; S3 limit is 10K)
-   *   - Lower 40 bits: chunk_index (supports up to 4 PB per part at 4KB chunks)
-   */
-  static constexpr unsigned CHUNK_INDEX_BITS = 40;
-  static constexpr uint64_t MAX_CHUNK_INDEX = (1ULL << CHUNK_INDEX_BITS) - 1;
-
    const DoutPrefixProvider* dpp;
  private:
    CephContext* cct;
@@ -897,19 +889,10 @@ public:
      return ENCRYPTED_CHUNK_SIZE;
    }
  
-  /**
-   * Encode chunk index as 8-byte big-endian AAD.
-   * Binds ciphertext to stream position, preventing chunk reordering attacks.
-   */
+  // Encode chunk index as 8-byte big-endian AAD for chunk reordering protection.
    static void encode_chunk_aad(uint8_t (&aad)[8], uint64_t chunk_index) {
-    aad[0] = (chunk_index >> 56) & 0xFF;
-    aad[1] = (chunk_index >> 48) & 0xFF;
-    aad[2] = (chunk_index >> 40) & 0xFF;
-    aad[3] = (chunk_index >> 32) & 0xFF;
-    aad[4] = (chunk_index >> 24) & 0xFF;
-    aad[5] = (chunk_index >> 16) & 0xFF;
-    aad[6] = (chunk_index >> 8) & 0xFF;
-    aad[7] = chunk_index & 0xFF;
+    uint64_t be = boost::endian::native_to_big(chunk_index);  // big-endian byte order regardless of host
+    memcpy(aad, &be, sizeof(be));  // aad[0] receives the most significant byte, aad[7] the least
    }
  
    CryptoAccelRef get_gcm_accel()
@@ -1273,18 +1256,18 @@ public:
      return true;
    }
  
-  /**
+  /*
     * IV cursor for efficient sequential IV generation.
-   * Emits zero-based IV and increments per chunk.
+   * Emits a 96-bit IV and increments per chunk.
     *
-   * Combined index layout (64 bits):
-   *   - Upper 24 bits: part_number (supports up to 16M parts; S3 limit is 10K)
-   *   - Lower 40 bits: chunk_index (supports up to 1T chunks per part)
+   * IV layout (96 bits):
+   *   - Upper 32 bits: part_number (supports up to 4B parts; S3 limit is 10K)
+   *   - Lower 64 bits: chunk_index (supports up to 64 ZB per part at 4KB chunks)
     */
    struct iv_cursor {
-    uint64_t lo;           // host-order low 64 bits of current IV
-    uint32_t hi;           // host-order high 32 bits of current IV
-    uint64_t chunk_index;  // current chunk index (for AAD)
+    uint32_t hi;           // part_number
+    uint64_t lo;           // chunk_index
+    uint64_t chunk_index;  // for AAD
  
      void emit(unsigned char (&iv)[AES_256_IVSIZE]) const {
        uint32_t be_hi = boost::endian::native_to_big(hi);
@@ -1295,32 +1278,15 @@ public:
  
      void advance() {
        lo++;
-      if (lo == 0) hi++;
        chunk_index++;
      }
    };
  
    bool init_iv_cursor(iv_cursor& cursor, off_t stream_offset) {
      ceph_assert(salt_initialized);
-
-    uint64_t chunk_index = stream_offset / CHUNK_SIZE;
-    if (chunk_index > MAX_CHUNK_INDEX) {
-      ldpp_dout(dpp, 0) << "ERROR: chunk_index " << chunk_index
-                        << " exceeds maximum " << MAX_CHUNK_INDEX
-                        << " - IV collision risk" << dendl;
-      return false;
-    }
-
-    cursor.chunk_index = chunk_index;
-    uint64_t combined_index =
-        (static_cast<uint64_t>(part_number_) << CHUNK_INDEX_BITS) | chunk_index;
-
-    /*
-     * Fixed zero IV base -- safe because derive_object_key() guarantees
-     * a unique key per object. IV uniqueness comes from the counter.
-     */
-    cursor.hi = 0;
-    cursor.lo = combined_index;
+    cursor.hi = part_number_;                // upper 32 bits of the IV: the part number
+    cursor.lo = stream_offset / CHUNK_SIZE;  // lower 64 bits of the IV: index of the chunk holding stream_offset
+    cursor.chunk_index = cursor.lo;          // same index, kept separately for the per-chunk AAD
      return true;
    }
  };
author	Matthew N. Heler <matthew.heler@hotmail.com>
	Wed, 8 Apr 2026 11:42:53 +0000 (06:42 -0500)
committer	Matthew N. Heler <matthew.heler@hotmail.com>
	Wed, 20 May 2026 18:31:02 +0000 (13:31 -0500)
src/crypto/isa-l/isal_crypto_accel.cc		patch \| blob \| history
src/rgw/rgw_crypt.cc		patch \| blob \| history