using storage_class_idx_t = uint8_t;
//---------------------------------------------------------------------------
- [[maybe_unused]] static int print_manifest(const DoutPrefixProvider *dpp,
+ [[maybe_unused]] static int print_manifest(CephContext *cct,
+ const DoutPrefixProvider *dpp,
RGWRados *rados,
const RGWObjManifest &manifest)
{
+ bool debug = cct->_conf->subsys.should_gather<ceph_subsys_rgw_dedup, 20>();
+ if (!debug) {
+ return 0;
+ }
+
unsigned idx = 0;
for (auto p = manifest.obj_begin(dpp); p != manifest.obj_end(dpp); ++p, ++idx) {
rgw_raw_obj raw_obj = p.get_location().get_raw_obj(rados);
{
d_head_object_size = cct->_conf->rgw_max_chunk_size;
d_min_obj_size_for_dedup = cct->_conf->rgw_dedup_min_obj_size_for_dedup;
- d_max_obj_size_for_split = cct->_conf->rgw_dedup_max_obj_size_for_split;
+ // limit split head to objects without tail
+ d_max_obj_size_for_split = d_head_object_size;
ldpp_dout(dpp, 10) << "Config Vals::d_head_object_size=" << d_head_object_size
<< "::d_min_obj_size_for_dedup=" << d_min_obj_size_for_dedup
<< "::d_max_obj_size_for_split=" << d_max_obj_size_for_split
const std::string &obj_name,
const std::string &instance,
const rgw_bucket &rb,
- librados::IoCtx *p_ioctx,
- std::string *p_oid)
+ librados::IoCtx *p_ioctx /*OUT*/,
+ std::string *p_oid /*OUT*/)
{
unique_ptr<rgw::sal::Bucket> bucket;
{
rgw::sal::Driver* driver,
rgw::sal::RadosStore* store,
const disk_record_t *p_rec,
- librados::IoCtx *p_ioctx,
- std::string *p_oid)
+ librados::IoCtx *p_ioctx /*OUT*/,
+ std::string *p_oid /*OUT*/)
{
rgw_bucket b{p_rec->tenant_name, p_rec->bucket_name, p_rec->bucket_id};
return get_ioctx_internal(dpp, driver, store, p_rec->obj_name, p_rec->instance,
//---------------------------------------------------------------------------
inline bool Background::should_split_head(uint64_t head_size, uint64_t obj_size)
{
- // max_obj_size_for_split of zero means don't split!
- return (head_size > 0 &&
- d_max_obj_size_for_split &&
- obj_size <= d_max_obj_size_for_split);
+ // Don't split RGW objects with existing tail-objects
+ // (head_size == obj_size means the entire payload fits in the head object,
+ //  i.e. there is no tail; head_size > 0 rejects empty/headless objects)
+ return (head_size > 0 && head_size == obj_size);
}
//---------------------------------------------------------------------------
const string &ref_tag = p_tgt_rec->ref_tag;
ldpp_dout(dpp, 20) << __func__ << "::ref_tag=" << ref_tag << dendl;
+ // src_manifest was updated in split-head case to include the new_tail
ret = inc_ref_count_by_manifest(ref_tag, src_oid, src_manifest);
if (unlikely(ret != 0)) {
if (p_src_rec->s.flags.is_split_head()) {
bufferlist new_manifest_bl;
adjust_target_manifest(src_manifest, tgt_manifest, new_manifest_bl);
tgt_op.setxattr(RGW_ATTR_MANIFEST, new_manifest_bl);
- //tgt_op.setxattr(RGW_ATTR_MANIFEST, p_src_rec->manifest_bl);
if (p_tgt_rec->s.flags.hash_calculated()) {
tgt_op.setxattr(RGW_ATTR_BLAKE3, tgt_hash_bl);
ldpp_dout(dpp, 20) << __func__ <<"::Set TGT Strong Hash in CLS"<< dendl;
ondisk_byte_size);
p_stats->shared_manifest_dedup_bytes += dedupable_objects_bytes;
ldpp_dout(dpp, 20) << __func__ << "::(1)skipped shared_manifest, SRC::block_id="
- << src_val.block_idx << "::rec_id=" << (int)src_val.rec_id << dendl;
+ << src_val.get_src_block_id()
+ << "::rec_id=" << (int)src_val.get_src_rec_id() << dendl;
return 0;
}
librados::ObjectWriteOperation op;
etag_to_bufferlist(p_rec->s.md5_high, p_rec->s.md5_low, p_rec->s.num_parts,
&etag_bl);
- init_cmp_pairs(dpp, p_rec, etag_bl, hash_bl /*OUT PARAM*/, &op);
+ init_cmp_pairs(dpp, p_rec, etag_bl, hash_bl /*OUT*/, &op);
op.setxattr(RGW_ATTR_BLAKE3, hash_bl);
std::string oid;
//---------------------------------------------------------------------------
static int read_hash_and_manifest(const DoutPrefixProvider *const dpp,
rgw::sal::Driver *driver,
- RGWRados *rados,
+ rgw::sal::RadosStore *store,
disk_record_t *p_rec)
{
librados::IoCtx ioctx;
std::string oid;
- int ret = get_ioctx(dpp, driver, rados, p_rec, &ioctx, &oid);
+ int ret = get_ioctx(dpp, driver, store, p_rec, &ioctx, &oid);
if (unlikely(ret != 0)) {
ldpp_dout(dpp, 5) << __func__ << "::ERR: failed get_ioctx()" << dendl;
return ret;
}
//---------------------------------------------------------------------------
- static void set_explicit_manifest(RGWObjManifest *p_manifest,
- std::map<uint64_t, RGWObjManifestPart> &objs_map)
+ // Build an explicit single-part manifest mapping the full object payload to
+ // @tail_name (loc_ofs=0, size == obj_size) and install it on @p_manifest.
+ // Precondition (asserted below): the object is head-only, so the whole
+ // payload can be described by one tail part.
+ // NOTE(review): @dpp is currently unused in the body — presumably kept for
+ // logging parity with sibling helpers; confirm before removing.
+ static void build_and_set_explicit_manifest(const DoutPrefixProvider *dpp,
+ const rgw_bucket *p_bucket,
+ const std::string &tail_name,
+ RGWObjManifest *p_manifest)
{
uint64_t obj_size = p_manifest->get_obj_size();
+ ceph_assert(obj_size == p_manifest->get_head_size());
+
+ // the tail key reuses the head's instance/ns so both resolve to the same
+ // bucket namespace
+ const rgw_obj &head_obj = p_manifest->get_obj();
+ const rgw_obj_key &head_key = head_obj.key;
+ rgw_obj_key tail_key(tail_name, head_key.instance, head_key.ns);
+ rgw_obj tail_obj(*p_bucket, tail_key);
+
+ RGWObjManifestPart tail_part;
+ tail_part.loc = tail_obj;
+ tail_part.loc_ofs = 0;
+ tail_part.size = obj_size;
+
+ std::map<uint64_t, RGWObjManifestPart> objs_map;
+ objs_map[0] = tail_part;
+
+ // demote the head: after the split all data lives in the explicit tail part
p_manifest->set_head_size(0);
p_manifest->set_max_head_size(0);
p_manifest->set_prefix("");
p_manifest->set_explicit(obj_size, objs_map);
}
- //---------------------------------------------------------------------------
- // This code is based on RGWObjManifest::convert_to_explicit()
- static void build_explicit_objs_map(const DoutPrefixProvider *dpp,
- RGWRados *rados,
- const RGWObjManifest &manifest,
- const rgw_bucket *p_bucket,
- std::map<uint64_t, RGWObjManifestPart> *p_objs_map,
- const std::string &tail_name,
- md5_stats_t *p_stats)
- {
- bool manifest_raw_obj_logged = false;
- unsigned idx = 0;
- auto p = manifest.obj_begin(dpp);
- while (p != manifest.obj_end(dpp)) {
- const uint64_t offset = p.get_stripe_ofs();
- const rgw_obj_select& os = p.get_location();
- ldpp_dout(dpp, 20) << __func__ << "::[" << idx <<"]OBJ: "
- << os.get_raw_obj(rados).oid << "::ofs=" << p.get_ofs()
- << "::strp_offset=" << offset << dendl;
-
- RGWObjManifestPart& part = (*p_objs_map)[offset];
- part.loc_ofs = 0;
-
- if (offset == 0) {
- ldpp_dout(dpp, 20) << __func__ << "::[" << idx <<"] HEAD OBJ: "
- << os.get_raw_obj(rados).oid << dendl;
- const rgw_obj &head_obj = manifest.get_obj();
- const rgw_obj_key &head_key = head_obj.key;
- // TBD: Can we have different instance/ns values for head/tail ??
- // Should we take the instance/ns from the head or tail?
- // Maybe should refuse objects with different instance/ns on head/tail ?
- rgw_obj_key tail_key(tail_name, head_key.instance, head_key.ns);
- rgw_obj tail_obj(*p_bucket, tail_key);
- part.loc = tail_obj;
- }
- else {
- // RGWObjManifest::convert_to_explicit() is assuming raw_obj, but looking
- // at the RGWObjManifest::obj_iterator code it is clear the obj is not raw.
- // If it happens to be raw we still handle it correctly (and inc stat-count)
- std::optional<rgw_obj> obj_opt = os.get_head_obj();
- if (obj_opt.has_value()) {
- part.loc = obj_opt.value();
- }
- else {
- // report raw object in manifest only once
- if (!manifest_raw_obj_logged) {
- manifest_raw_obj_logged = true;
- ldpp_dout(dpp, 10) << __func__ << "::WARN: obj is_raw" << dendl;
- p_stats->manifest_raw_obj++;
- }
- const rgw_raw_obj& raw = os.get_raw_obj(rados);
- RGWSI_Tier_RADOS::raw_obj_to_obj(*p_bucket, raw, &part.loc);
- }
- }
-
- ++p;
- uint64_t next_offset = p.get_stripe_ofs();
- part.size = next_offset - offset;
- idx++;
- } // while (p != manifest.obj_end())
- }
-
//---------------------------------------------------------------------------
int Background::split_head_object(disk_record_t *p_src_rec, // IN-OUT PARAM
RGWObjManifest &src_manifest, // IN/OUT PARAM
bufferlist bl;
std::string head_oid;
librados::IoCtx ioctx;
- int ret = get_ioctx(dpp, driver, rados, p_src_rec, &ioctx, &head_oid);
+ int ret = get_ioctx(dpp, driver, store, p_src_rec, &ioctx, &head_oid);
if (unlikely(ret != 0)) {
ldpp_dout(dpp, 1) << __func__ << "::ERR: failed get_ioctx()" << dendl;
return ret;
}
}
- bool exclusive = true; // block overwrite
std::string tail_name = generate_split_head_tail_name(src_manifest);
const rgw_bucket_placement &tail_placement = src_manifest.get_tail_placement();
// Tail placement_rule was fixed before being committed to the SLAB; if it looks bad -> abort
return ret;
}
+ bool exclusive = true; // block overwrite
ret = tail_ioctx.create(tail_oid, exclusive);
if (ret == 0) {
ldpp_dout(dpp, 20) << __func__ << "::successfully created: " << tail_oid << dendl;
ldpp_dout(dpp, 1) << __func__ << "::ERROR: failed to write " << tail_oid
<< " with: " << cpp_strerror(-ret) << dendl;
// don't leave orphan object behind
- tail_ioctx.remove(tail_oid);
+ int ret_rmv = tail_ioctx.remove(tail_oid);
+ if (ret_rmv != 0) {
+ ldpp_dout(dpp, 1) << __func__ << "::ERROR: failed to remove " << tail_oid
+ << " with: " << cpp_strerror(-ret_rmv) << dendl;
+ }
return ret;
}
else {
<< ret << dendl;
}
- std::map<uint64_t, RGWObjManifestPart> objs_map;
- build_explicit_objs_map(dpp, rados, src_manifest, p_bucket, &objs_map,
- tail_name, p_stats);
- set_explicit_manifest(&src_manifest, objs_map);
+ build_and_set_explicit_manifest(dpp, p_bucket, tail_name, &src_manifest);
bufferlist manifest_bl;
encode(src_manifest, manifest_bl);
// read the manifest and strong hash from the head-object attributes
ldpp_dout(dpp, 20) << __func__ << "::Fetch SRC strong hash from head-object::"
<< p_src_rec->obj_name << dendl;
- if (unlikely(read_hash_and_manifest(dpp, driver, rados, p_src_rec) != 0)) {
+ if (unlikely(read_hash_and_manifest(dpp, driver, store, p_src_rec) != 0)) {
return false;
}
try {
}
//---------------------------------------------------------------------------
- static bool parse_manifests(const DoutPrefixProvider *dpp,
- const disk_record_t *p_src_rec,
- const disk_record_t *p_tgt_rec,
- RGWObjManifest *p_src_manifest,
- RGWObjManifest *p_tgt_manifest)
+ static int parse_manifests(const DoutPrefixProvider *dpp,
+ const disk_record_t *p_src_rec,
+ const disk_record_t *p_tgt_rec,
+ RGWObjManifest *p_src_manifest,
+ RGWObjManifest *p_tgt_manifest)
{
bool valid_src_manifest = false;
try {
const RGWObjManifest &tgt_manifest,
md5_stats_t *p_stats)
{
+ // The only case leading to this scenario is server-side-copy
+
+ // server-side-copy can only share tail-objects
+ // since no tail-objects exists -> no sharing could be possible
+ if (!tgt_manifest.has_tail()) {
+ return false;
+ }
+
+ // tail objects with a non-explicit manifest are simply the prefix plus a running count
+ if (!tgt_manifest.has_explicit_objs() && !src_manifest.has_explicit_objs()) {
+ return (tgt_manifest.get_prefix() == src_manifest.get_prefix());
+ }
+
// Build a vector with all tail-objects on the SRC and then iterate over
// the TGT tail-objects looking for a single tail-object in both manifests.
- // If found -> abort the dedup
- // The only case leading to this scenario is server-side-copy
- // It is probably enough to scan the first few tail-objects, but better safe...
+ // It is enough to scan the first few tail-objects
+
+ constexpr unsigned MAX_OBJ_TO_COMPARE = 4;
std::string src_oid = build_oid(p_src_rec->bucket_id, p_src_rec->obj_name);
std::string tgt_oid = build_oid(p_tgt_rec->bucket_id, p_tgt_rec->obj_name);
std::vector<std::string> vec;
else {
ldpp_dout(dpp, 20) << __func__ << "::[" << idx <<"] Skip HEAD OBJ: "
<< raw_obj.oid << dendl;
- continue;
+ }
+ if (idx >= MAX_OBJ_TO_COMPARE) {
+ break;
}
}
+
idx = 0;
for (auto p = tgt_manifest.obj_begin(dpp); p != tgt_manifest.obj_end(dpp); ++p, ++idx) {
rgw_raw_obj raw_obj = p.get_location().get_raw_obj(rados);
else {
ldpp_dout(dpp, 20) << __func__ << "::[" << idx <<"] Skip HEAD OBJ: "
<< raw_obj.oid << dendl;
- continue;
+ }
+ if (idx >= MAX_OBJ_TO_COMPARE) {
+ break;
}
}
return 0;
}
+ RGWObjManifest src_manifest, tgt_manifest;
ret = parse_manifests(dpp, p_src_rec, p_tgt_rec, &src_manifest, &tgt_manifest);
if (unlikely(ret != 0)) {
return 0;
MB=(1024*KB)
POTENTIAL_OBJ_SIZE=(64*KB)
DEDUP_MIN_OBJ_SIZE=(64*KB)
-SPLIT_HEAD_SIZE=(16*MB)
+SPLIT_HEAD_SIZE=(4*MB)
RADOS_OBJ_SIZE=(4*MB)
# The default multipart threshold size for S3cmd is 15 MB.
MULTIPART_SIZE=(15*MB)
listing=conn.list_objects_v2(**list_args)
if 'Contents' not in listing or len(listing['Contents'])== 0:
- return 0
+ return obj_count
obj_count += len(listing['Contents'])
return obj_count
-#-------------------------------------------------------------------------------
-def copy_obj(base_bucket_name, base_key, bucket_name, key):
- s3_prefix="s3://"
- src = s3_prefix + base_bucket_name + "/" + base_key
- dest = s3_prefix + bucket_name + "/" + key
- result = bash(['s3cmd', 'cp', src, dest])
- assert result[1] == 0
-
#-------------------------------------------------------------------------------
def count_object_parts_in_all_buckets(verbose=False, expected_size=0):
result = rados(['lspools'])
if (rados_count > 1000):
### we can only do about 10 stat call per-second!!
### TBD: add obj_size to ls output to allow more efficient size check
- log.info(">>> rados obj_count(%d) is too high -> skip stat check\n",
+ log.info(">>> rados obj_count(%d) is too high -> skip stat check",
len(names))
expected_size = 0
for error in response['Errors']:
log.error("delete_objects::ERROR::Key=%s, Code=%s, Message=%s",
error['Key'], error['Code'], error['Message'])
-
+ assert(0)
else:
log.debug("All objects deleted successfully.")
listing=conn.list_objects_v2(**list_args)
if 'Contents' not in listing or len(listing['Contents'])== 0:
log.debug("Bucket '%s' is empty, skipping...", bucket_name)
- return
+ break
objects=[]
for obj in listing['Contents']:
log.debug("Based on calculation we should have %d duplicated tail objs", duplicated_tail_objs)
log.debug("Based on calculation we should have %.2f MiB total in pool", total_space/MB)
log.debug("Based on calculation we should have %.2f MiB duplicated space in pool", duplicated_space/MB)
- log.info("split_head_objs=%d, rados_objects_total=%d, duplicated_tail_objs=%d",
+ log.debug("split_head_objs=%d, rados_objects_total=%d, duplicated_tail_objs=%d",
split_head_objs, rados_objects_total, duplicated_tail_objs)
expected_rados_obj_count_post_dedup=(split_head_objs+rados_objects_total-duplicated_tail_objs)
log.debug("Post dedup expcted rados obj count = %d", expected_rados_obj_count_post_dedup)
log.debug("upload_objects::<%s/%s>", bucket_names[ten_id], key)
log.debug("==========================================")
- log.debug("Summery:%d S3 objects were uploaded (%d rados objects), total size = %.2f MiB",
+ log.debug("Summary:%d S3 objects were uploaded (%d rados objects), total size = %.2f MiB",
s3_objects_total, rados_objects_total, total_space/MB)
log.debug("Based on calculation we should have %d rados objects", rados_objects_total)
log.debug("Based on calculation we should have %d duplicated tail objs", duplicated_tail_objs)
proc_list[idx].join()
log.debug("==========================================")
- log.debug("Summery:%d S3 objects were uploaded (%d rados objects), total size = %.2f MiB",
+ log.debug("Summary:%d S3 objects were uploaded (%d rados objects), total size = %.2f MiB",
s3_objects_total, rados_objects_total, total_space/MB)
log.debug("Based on calculation we should have %d rados objects", rados_objects_total)
log.debug("Based on calculation we should have %d duplicated tail objs", duplicated_tail_objs)
key=obj['Key']
log.debug("check_if_any_obj_exists: key=%s", key)
if obj['Key'] in delete_set:
- log.info("key <%s> was found in bucket", key)
+ log.warning("Deleted key <%s> was found in bucket", key)
+ return True
if 'NextContinuationToken' in listing:
continuation_token = listing['NextContinuationToken']
else:
break
+ return False
#-------------------------------------------------------------------------------
def delete_objects_multi(conns, bucket_names, ten_id, object_keys):
verify=True
if verify:
log.debug("delete_dup_objects: verify delete_list_total")
- check_if_any_obj_exists(bucket_name, delete_list_total, conn)
+ assert(check_if_any_obj_exists(bucket_name, delete_list_total, conn)==False)
# must call garbage collection for predictable count
result = admin(['gc', 'process', '--include-all'])
for i in range(1, num_copies):
filecmp.clear_cache()
key = gen_object_name(filename, i)
- log.debug("comparing object %s with file %s", key, filename)
ten_id = i % max_tenants
+ log.debug("comparing object %s/%s with file %s", bucket_names[ten_id], key, filename)
conns[ten_id].download_file(bucket_names[ten_id], key, tmpfile,
Config=config)
equal = filecmp.cmp(tmpfile, OUT_DIR + filename, shallow=False)
for f in files:
filename=f[0]
key = gen_object_name(filename, i)
- log.debug("comparing object %s with file %s", key, filename)
ten_id = i % max_tenants
+ log.debug("comparing object %s/%s with file %s", bucket_names[ten_id], key, filename)
conns[ten_id].download_file(bucket_names[ten_id], key, tmpfile,
Config=config)
equal = filecmp.cmp(tmpfile, OUT_DIR + filename, shallow=False)
#-------------------------------------------------------------------------------
-def read_dedup_ratio(json):
+def read_dedup_ratio(jstats, field):
dedup_ratio=Dedup_Ratio()
+ json=jstats[field]
dedup_ratio.s3_bytes_before=json['s3_bytes_before']
dedup_ratio.s3_bytes_after=json['s3_bytes_after']
dedup_ratio.ratio=json['dedup_ratio']
- log.debug("Completed! ::ratio=%f", dedup_ratio.ratio)
+ log.debug("%s::before=%d, after=%d, ratio=%f", field,
+ dedup_ratio.s3_bytes_before, dedup_ratio.s3_bytes_after,
+ dedup_ratio.ratio)
return dedup_ratio
#-------------------------------------------------------------------------------
dedup_work_was_completed=jstats['completed']
if dedup_work_was_completed:
- dedup_ratio_estimate=read_dedup_ratio(jstats['dedup_ratio_estimate'])
- dedup_ratio_actual=read_dedup_ratio(jstats['dedup_ratio_actual'])
+ dedup_ratio_estimate=read_dedup_ratio(jstats, 'dedup_ratio_estimate')
+ dedup_ratio_actual=read_dedup_ratio(jstats, 'dedup_ratio_actual')
else:
log.debug("Uncompleted!")
if dry_run == False:
log.debug("Verify all objects")
verify_objects(bucket_name, files, conn, expected_results, config, run_cleanup_after)
+
+ return ret
finally:
if run_cleanup_after:
# cleanup must be executed even after a failure
cleanup(bucket_name, conn)
- return ret
-
-
#-------------------------------------------------------------------------------
def simple_dedup_with_tenants(files, conns, bucket_names, config, dry_run=False):
indices=[0] * len(files)
rados_obj_total = 0
duplicated_tail_objs = 0
+ split_head_objs = 0
for key, value in size_dict.items():
size = value
num_copies = num_copies_dict[key]
assert num_copies > 0
rados_obj_count = calc_rados_obj_count(num_copies, size, config)
rados_obj_total += (rados_obj_count * num_copies)
+ split_head_objs += calc_split_objs_count(size, num_copies, config)
duplicated_tail_objs += ((num_copies-1) * (rados_obj_count-1))
# versioned buckets hold an extra rados-obj per versioned S3-Obj
unique_s3_objs_count = len(unique_s3_objs)
rados_obj_total += unique_s3_objs_count
- rados_obj_count_post_dedup=(rados_obj_total-duplicated_tail_objs)
+ rados_obj_count_post_dedup=(split_head_objs+rados_obj_total-duplicated_tail_objs)
log.debug("calc::rados_obj_total=%d, rados_obj_count_post_dedup=%d",
rados_obj_total, rados_obj_count_post_dedup)
return(rados_obj_total, rados_obj_count_post_dedup, unique_s3_objs_count)
# finally make sure no rados-object was left behind after the last ver was removed
@pytest.mark.basic_test
def test_dedup_with_versions():
- #return
-
if full_dedup_is_disabled():
return
# enable versioning
conn.put_bucket_versioning(Bucket=bucket_name,
VersioningConfiguration={"Status": "Enabled"})
+ print_bucket_versioning(conn, bucket_name)
ver_count=7
first_time=True
for i in range(0, ver_count):
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_etag_corruption():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_md5_collisions():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_split_head_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
def loop_dedup_split_head():
prepare_test()
- #bucket_name = gen_bucket_name()
- bucket_name = "bucket1"
+ bucket_name = "splitheadbucket"
config=default_config
- max_copies_count=4
files=[]
+ max_copies_count=4
num_files=11 # [16KB-32MB]
base_size = 16*KB
log.debug("generate files: base size=%d KiB, max_size=%d KiB",
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
-def test_dedup_split_head():
- #return
-
+def test_dedup_split_head_simple():
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_copy():
- #return
dedup_copy_internal(False)
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_copy_multi_buckets():
- #return
dedup_copy_internal(True)
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
-def test_dedup_small():
- #return
+def test_copy_after_dedup():
+ if full_dedup_is_disabled():
+ return
+
+ prepare_test()
+ log.debug("test_copy_after_dedup: connect to AWS ...")
+ max_copies_count=3
+ num_files=8
+ files=[]
+ min_size=8*MB
+
+ # create files in range [8MB, 32MB] aligned on RADOS_OBJ_SIZE
+ gen_files_in_range(files, num_files, min_size, min_size*4)
+
+ # add file with excatly MULTIPART_SIZE
+ write_random(files, MULTIPART_SIZE, 2, 2)
+ bucket_cp= gen_bucket_name()
+ bucket_names=[]
+ try:
+ conn = get_single_connection()
+ conn.create_bucket(Bucket=bucket_cp)
+ bucket_names=create_buckets(conn, max_copies_count)
+ conns=[conn] * max_copies_count
+ dry_run=False
+ ret = simple_dedup_with_tenants(files, conns, bucket_names, default_config,
+ dry_run)
+ expected_results = ret[0]
+ dedup_stats = ret[1]
+ cp_head_count=0
+ for f in files:
+ filename=f[0]
+ obj_size=f[1]
+ num_copies=f[2]
+ for i in range(0, num_copies):
+ key = gen_object_name(filename, i)
+ key_cp = key + "_cp"
+ bucket_name = bucket_names[i]
+ base_obj = {'Bucket': bucket_name, 'Key': key}
+ log.debug("copy_object({%s, %s} -> %s/%s", bucket_name, key, bucket_cp, key_cp);
+ conn.copy_object(CopySource=base_obj, Bucket=bucket_cp, Key=key_cp)
+ cp_head_count += 1
+
+ assert (expected_results + cp_head_count) == count_object_parts_in_all_buckets(False, 0)
+ finally:
+ # cleanup must be executed even after a failure
+ delete_bucket_with_all_objects(bucket_cp, conn)
+ cleanup_all_buckets(bucket_names, conns)
+
+#-------------------------------------------------------------------------------
+@pytest.mark.basic_test
+def test_dedup_small():
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_small_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
# should be made to the system
@pytest.mark.basic_test
def test_dedup_inc_0_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
# should be made to the system
@pytest.mark.basic_test
def test_dedup_inc_0():
- #return
-
if full_dedup_is_disabled():
return
# 3) Run another dedup
@pytest.mark.basic_test
def test_dedup_inc_1_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
# 3) Run another dedup
@pytest.mark.basic_test
def test_dedup_inc_1():
- #return
-
if full_dedup_is_disabled():
return
# 4) Run another dedup
@pytest.mark.basic_test
def test_dedup_inc_2_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
# 4) Run another dedup
@pytest.mark.basic_test
def test_dedup_inc_2():
- #return
-
if full_dedup_is_disabled():
return
# 3) Run another dedup
@pytest.mark.basic_test
def test_dedup_inc_with_remove_multi_tenants():
- #return
if full_dedup_is_disabled():
return
# 3) Run another dedup
@pytest.mark.basic_test
def test_dedup_inc_with_remove():
- #return
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_multipart_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_multipart():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_basic_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_basic():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_small_multipart_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_small_multipart():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_large_scale_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_large_scale():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_empty_bucket():
- #return
-
if full_dedup_is_disabled():
return
@pytest.mark.basic_test
#@pytest.mark.inc_test
def test_dedup_inc_loop_with_tenants():
- #return
-
if full_dedup_is_disabled():
return
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_small_with_tenants():
- #return
-
log.debug("test_dedup_dry_small_with_tenants: connect to AWS ...")
prepare_test()
max_copies_count=3
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_multipart():
- #return
-
prepare_test()
bucket_name = gen_bucket_name()
log.debug("test_dedup_dry_multipart: connect to AWS ...")
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_basic():
- #return
-
prepare_test()
bucket_name = gen_bucket_name()
log.debug("test_dedup_dry_basic: connect to AWS ...")
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_small_multipart():
- #return
-
prepare_test()
log.debug("test_dedup_dry_small_multipart: connect to AWS ...")
config2 = TransferConfig(multipart_threshold=4*KB, multipart_chunksize=1*MB)
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_small():
- #return
-
bucket_name = gen_bucket_name()
log.debug("test_dedup_dry_small: connect to AWS ...")
conn=get_single_connection()
# 6) verify that dedup ratio is reported correctly
@pytest.mark.basic_test
def test_dedup_dry_small_large_mix():
- #return
-
dry_run=True
log.debug("test_dedup_dry_small_large_mix: connect to AWS ...")
prepare_test()
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_basic_with_tenants():
- #return
-
prepare_test()
max_copies_count=3
num_files=23
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_multipart_with_tenants():
- #return
-
prepare_test()
log.debug("test_dedup_dry_multipart_with_tenants: connect to AWS ...")
max_copies_count=3
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_small_multipart_with_tenants():
- #return
-
prepare_test()
max_copies_count=4
num_files=10
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_large_scale_with_tenants():
- #return
-
prepare_test()
max_copies_count=3
num_threads=64
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_dry_large_scale():
- #return
-
prepare_test()
bucket_name = gen_bucket_name()
max_copies_count=2
#-------------------------------------------------------------------------------
def __test_dedup_identical_copies(files, config, dry_run, verify, force_clean=False):
+ finished=False
num_threads=32
bucket_name = "bucket1"
conns=get_connections(num_threads)
end_time = time.time_ns()
log.info("Verify all objects time = %d(sec)",
(end_time - start_time)/1_000_000_000)
+ finished=True
finally:
# cleanup must be executed even after a failure
- if not dry_run or force_clean:
+ if not dry_run or force_clean or not finished:
log.info("cleanup bucket")
cleanup(bucket_name, conns[0])
@pytest.mark.basic_test
def test_dedup_identical_copies_1():
num_files=1
- copies_count=64*1024+1
+ copies_count=1024
size=64*KB
config=default_config
prepare_test()
log.info("test_dedup_identical_copies:full test")
__test_dedup_identical_copies(files, config, dry_run, verify, force)
-#-------------------------------------------------------------------------------
-@pytest.mark.basic_test
-def test_dedup_identical_copies_multipart():
- num_files=1
- copies_count=64*1024+1
- size=16*KB
- prepare_test()
- files=[]
- gen_files_fixed_copies(files, num_files, size, copies_count)
- config=TransferConfig(multipart_threshold=size, multipart_chunksize=size)
- # start with a dry_run
- dry_run=True
- verify=False
- log.info("test_dedup_identical_copies_multipart:dry test")
- __test_dedup_identical_copies(files, config, dry_run, verify)
-
- # and then perform a full dedup
- dry_run=False
- verify=False
- force_clean=True
- log.info("test_dedup_identical_copies_multipart:full test")
- __test_dedup_identical_copies(files, config, dry_run, verify, force_clean)
-
#-------------------------------------------------------------------------------
@pytest.mark.basic_test
def test_dedup_identical_copies_multipart_small():
files=[]
gen_files_fixed_copies(files, num_files, size, copies_count)
config=TransferConfig(multipart_threshold=size, multipart_chunksize=size)
+
# start with a dry_run
dry_run=True
verify=False
log.info("test_dedup_identical_copies_multipart:full test")
__test_dedup_identical_copies(files, config, dry_run, verify, force_clean)
+
+#-------------------------------------------------------------------------------
+@pytest.mark.basic_test
+def test_copy_single_obj():
+    # NOTE(review): the unconditional 'return' below disables this test — the
+    # body is dead code. It targets hard-coded buckets ("bucket2"/"bucket3"),
+    # so presumably it is a manual debug helper left in deliberately; confirm
+    # intent before merging.
+    return
+    conn=get_single_connection()
+    base_obj = {'Bucket': "bucket2", 'Key': "rados2"}
+    conn.copy_object(CopySource=base_obj, Bucket="bucket3", Key="rados3")
+