Fix MEMORY USAGE command (#14288)

After the key-value unification (kvobj), the MEMORY USAGE command may no longer account for the embedded key length stored within the kvobj. To fix this, replace sizeof(*o) with zmalloc_size((void *)o) to ensure the full allocated size is measured. In this context, the function objectComputeSize() was renamed and modified to kvobjComputeSize(). From computing only the value size to compute the key and its value.
2026-01-10 06:58:17 -05:00 · 2025-08-20 13:54:45 +03:00
parent ca9ede6968
commit e6c261f3fb
4 changed files with 51 additions and 21 deletions
--- a/src/object.c
+++ b/src/object.c
@@ -1202,24 +1202,27 @@ size_t streamRadixTreeMemoryUsage(rax *rax) {
    return size;
 }

-/* Returns the size in bytes consumed by the key's value in RAM.
+/* Returns the size in bytes consumed by the object header, key and value in RAM.
 * Note that the returned value is just an approximation, especially in the
 * case of aggregated data types where only "sample_size" elements
 * are checked and averaged to estimate the total size. */
 #define OBJ_COMPUTE_SIZE_DEF_SAMPLES 5 /* Default sample size. */
-size_t objectComputeSize(robj *key, robj *o, size_t sample_size, int dbid) {
+size_t kvobjComputeSize(robj *key, kvobj *o, size_t sample_size, int dbid) {
    dict *d;
    dictIterator di;
    struct dictEntry *de;
-    size_t asize = 0, elesize = 0, elecount = 0, samples = 0;
+    size_t elesize = 0, elecount = 0, samples = 0;
+    
+    /* All kv-objects has at least kvobj header and embedded key */
+    size_t asize = zmalloc_size((void *)o);

    if (o->type == OBJ_STRING) {
        if(o->encoding == OBJ_ENCODING_INT) {
-            asize = sizeof(*o);
+            /* Value already counted (reuse the "ptr" in header to store int) */
        } else if(o->encoding == OBJ_ENCODING_RAW) {
-            asize = sdsZmallocSize(o->ptr)+sizeof(*o);
+            asize += sdsZmallocSize(o->ptr);
        } else if(o->encoding == OBJ_ENCODING_EMBSTR) {
-            asize = zmalloc_size((void *)o);
+            /* Value already counted (Value embedded in the object as well) */
        } else {
            serverPanic("Unknown string encoding");
        }
@@ -1227,7 +1230,7 @@ size_t objectComputeSize(robj *key, robj *o, size_t sample_size, int dbid) {
        if (o->encoding == OBJ_ENCODING_QUICKLIST) {
            quicklist *ql = o->ptr;
            quicklistNode *node = ql->head;
-            asize = sizeof(*o)+sizeof(quicklist);
+            asize += sizeof(quicklist);
            do {
                elesize += sizeof(quicklistNode)+zmalloc_size(node->entry);
                elecount += node->count;
@@ -1235,7 +1238,7 @@ size_t objectComputeSize(robj *key, robj *o, size_t sample_size, int dbid) {
            } while ((node = node->next) && samples < sample_size);
            asize += (double)elesize/elecount*ql->count;
        } else if (o->encoding == OBJ_ENCODING_LISTPACK) {
-            asize = sizeof(*o)+zmalloc_size(o->ptr);
+            asize += zmalloc_size(o->ptr);
        } else {
            serverPanic("Unknown list encoding");
        }
@@ -1243,7 +1246,7 @@ size_t objectComputeSize(robj *key, robj *o, size_t sample_size, int dbid) {
        if (o->encoding == OBJ_ENCODING_HT) {
            d = o->ptr;
            dictInitIterator(&di, d);
-            asize = sizeof(*o)+sizeof(dict)+(sizeof(struct dictEntry*)*dictBuckets(d));
+            asize += sizeof(dict) + (sizeof(struct dictEntry*) * dictBuckets(d));
            while((de = dictNext(&di)) != NULL && samples < sample_size) {
                sds ele = dictGetKey(de);
                elesize += dictEntryMemUsage(0) + sdsZmallocSize(ele);
@@ -1252,20 +1255,20 @@ size_t objectComputeSize(robj *key, robj *o, size_t sample_size, int dbid) {
            dictResetIterator(&di);
            if (samples) asize += (double)elesize/samples*dictSize(d);
        } else if (o->encoding == OBJ_ENCODING_INTSET) {
-            asize = sizeof(*o)+zmalloc_size(o->ptr);
+            asize += zmalloc_size(o->ptr);
        } else if (o->encoding == OBJ_ENCODING_LISTPACK) {
-            asize = sizeof(*o)+zmalloc_size(o->ptr);
+            asize += zmalloc_size(o->ptr);
        } else {
            serverPanic("Unknown set encoding");
        }
    } else if (o->type == OBJ_ZSET) {
        if (o->encoding == OBJ_ENCODING_LISTPACK) {
-            asize = sizeof(*o)+zmalloc_size(o->ptr);
+            asize += zmalloc_size(o->ptr);
        } else if (o->encoding == OBJ_ENCODING_SKIPLIST) {
            d = ((zset*)o->ptr)->dict;
            zskiplist *zsl = ((zset*)o->ptr)->zsl;
            zskiplistNode *znode = zsl->header->level[0].forward;
-            asize = sizeof(*o)+sizeof(zset)+sizeof(zskiplist)+sizeof(dict)+
+            asize += sizeof(zset) + sizeof(zskiplist) + sizeof(dict) +
                    (sizeof(struct dictEntry*)*dictBuckets(d))+
                    zmalloc_size(zsl->header);
            while(znode != NULL && samples < sample_size) {
@@ -1280,14 +1283,14 @@ size_t objectComputeSize(robj *key, robj *o, size_t sample_size, int dbid) {
        }
    } else if (o->type == OBJ_HASH) {
        if (o->encoding == OBJ_ENCODING_LISTPACK) {
-            asize = sizeof(*o)+zmalloc_size(o->ptr);
+            asize += zmalloc_size(o->ptr);
        } else if (o->encoding == OBJ_ENCODING_LISTPACK_EX) {
            listpackEx *lpt = o->ptr;
-            asize = sizeof(*o) + zmalloc_size(lpt) + zmalloc_size(lpt->lp);
+            asize += zmalloc_size(lpt) + zmalloc_size(lpt->lp);
        } else if (o->encoding == OBJ_ENCODING_HT) {
            d = o->ptr;
            dictInitIterator(&di, d);
-            asize = sizeof(*o)+sizeof(dict)+(sizeof(struct dictEntry*)*dictBuckets(d));
+            asize += sizeof(dict) + (sizeof(struct dictEntry*) * dictBuckets(d));
            while((de = dictNext(&di)) != NULL && samples < sample_size) {
                hfield ele = dictGetKey(de);
                sds ele2 = dictGetVal(de);
@@ -1302,7 +1305,7 @@ size_t objectComputeSize(robj *key, robj *o, size_t sample_size, int dbid) {
        }
    } else if (o->type == OBJ_STREAM) {
        stream *s = o->ptr;
-        asize = sizeof(*o)+sizeof(*s);
+        asize += sizeof(*s);
        asize += streamRadixTreeMemoryUsage(s->rax);

        /* Now we have to add the listpacks. The last listpack is often non
@@ -1364,7 +1367,7 @@ size_t objectComputeSize(robj *key, robj *o, size_t sample_size, int dbid) {
            raxStop(&ri);
        }
    } else if (o->type == OBJ_MODULE) {
-        asize = moduleGetMemUsage(key, o, sample_size, dbid);
+        asize += moduleGetMemUsage(key, o, sample_size, dbid);
    } else {
        serverPanic("Unknown object type");
    }
@@ -1780,7 +1783,7 @@ NULL
            addReplyNull(c);
            return;
        }
-        size_t usage = objectComputeSize(c->argv[2], (robj *)kv, samples, c->db->id);
+        size_t usage = kvobjComputeSize(c->argv[2], kv, samples, c->db->id);
        addReplyLongLong(c,usage);
    } else if (!strcasecmp(c->argv[1]->ptr,"stats") && c->argc == 2) {
        struct redisMemOverhead *mh = getMemoryOverheadData();
--- a/tests/unit/type/hash.tcl
+++ b/tests/unit/type/hash.tcl
@@ -43,7 +43,7 @@ start_server {tags {"hash"}} {
        create_hash myhash $contents
        assert_encoding $type myhash

-        # coverage for objectComputeSize
+        # coverage for kvobjComputeSize
        assert_morethan [memory_usage myhash] 0

        test "HRANDFIELD - $type" {
--- a/tests/unit/type/list.tcl
+++ b/tests/unit/type/list.tcl
@@ -2241,7 +2241,7 @@ foreach {pop} {BLPOP BLMPOP_RIGHT} {
        set k [r lrange k 0 -1]
        set dump [r dump k]

-        # coverage for objectComputeSize
+        # coverage for kvobjComputeSize
        assert_morethan [memory_usage k] 0

        config_set sanitize-dump-payload no mayfail
--- a/tests/unit/type/string.tcl
+++ b/tests/unit/type/string.tcl
@@ -684,6 +684,33 @@ if {[string match {*jemalloc*} [s mem_allocator]]} {
        lappend res [r get bar]
    } {12 12}
    
+    # coverage for kvobjComputeSize
+    test {MEMORY USAGE - STRINGS} {
+        set sizes {1 5 8 15 16 17 31 32 33 63 64 65 127 128 129 255 256 257}
+        set hdrsize [expr {[s arch_bits] == 32 ? 12 : 16}]
+        
+        foreach ksize $sizes {
+            set key [string repeat "k" $ksize]
+            # OBJ_ENCODING_EMBSTR, OBJ_ENCODING_RAW        
+            foreach vsize $sizes {
+                set value [string repeat "v" $vsize]                        
+                r set $key $value
+                set memory_used [r memory usage $key]
+                set min [expr $hdrsize + $ksize + $vsize] 
+                assert_lessthan_equal $min $memory_used
+                set max [expr {32 > $min ? 64 : [expr $min * 2]}]
+                assert_morethan_equal $max $memory_used
+            }
+            
+            # OBJ_ENCODING_INT
+            foreach value {1 100 10000 10000000} {
+                r set $key $value
+                set min [expr $hdrsize + $ksize]
+                assert_lessthan_equal $min [r memory usage $key]
+            }
+        }
+    }
+    
    if {[string match {*jemalloc*} [s mem_allocator]]} {
        test {Check MEMORY USAGE for embedded key strings with jemalloc} {