diff options
| author | H.J. Lu <hjl.tools@gmail.com> | 2024-11-26 16:15:25 +0800 |
|---|---|---|
| committer | H.J. Lu <hjl.tools@gmail.com> | 2024-12-04 04:28:15 +0800 |
| commit | 1c4cebb84b9e33aea9a90adfadb031d1f1eba927 (patch) | |
| tree | b8c59eb6388c942da858d8a1881e739c17493d73 /malloc | |
| parent | f43eb2cf30fdff39bda1c2018246d4badabbc576 (diff) | |
| download | glibc-1c4cebb84b9e33aea9a90adfadb031d1f1eba927.tar.xz glibc-1c4cebb84b9e33aea9a90adfadb031d1f1eba927.zip | |
malloc: Optimize small memory clearing for calloc
Add calloc-clear-memory.h to clear small blocks of memory, up to 36 bytes
(72 bytes on 64-bit targets), for calloc. Use repeated stores with 1 branch
instead of up to 3 branches. On x86-64, this is faster than memset, since
calling memset needs 1 indirect branch, 1 broadcast, and up to 4 branches.
Signed-off-by: H.J. Lu <hjl.tools@gmail.com>
Reviewed-by: Wilco Dijkstra <Wilco.Dijkstra@arm.com>
Diffstat (limited to 'malloc')
| -rw-r--r-- | malloc/malloc-internal.h | 1 | ||||
| -rw-r--r-- | malloc/malloc.c | 36 |
2 files changed, 2 insertions, 35 deletions
```diff
diff --git a/malloc/malloc-internal.h b/malloc/malloc-internal.h
index cba03433fe..3349e2d1fe 100644
--- a/malloc/malloc-internal.h
+++ b/malloc/malloc-internal.h
@@ -23,6 +23,7 @@
 #include <malloc-sysdep.h>
 #include <malloc-size.h>
 #include <malloc-hugepages.h>
+#include <calloc-clear-memory.h>
 
 /* Called in the parent process before a fork.  */
 void __malloc_fork_lock_parent (void) attribute_hidden;
diff --git a/malloc/malloc.c b/malloc/malloc.c
index 287fa0904d..ac3901bdd5 100644
--- a/malloc/malloc.c
+++ b/malloc/malloc.c
@@ -3755,8 +3755,6 @@ __libc_calloc (size_t n, size_t elem_size)
   INTERNAL_SIZE_T sz, oldtopsize;
   void *mem;
   unsigned long clearsize;
-  unsigned long nclears;
-  INTERNAL_SIZE_T *d;
   ptrdiff_t bytes;
 
   if (__glibc_unlikely (__builtin_mul_overflow (n, elem_size, &bytes)))
@@ -3853,40 +3851,8 @@ __libc_calloc (size_t n, size_t elem_size)
     }
 #endif
 
-  /* Unroll clear of <= 36 bytes (72 if 8byte sizes).  We know that
-     contents have an odd number of INTERNAL_SIZE_T-sized words;
-     minimally 3.  */
-  d = (INTERNAL_SIZE_T *) mem;
   clearsize = csz - SIZE_SZ;
-  nclears = clearsize / sizeof (INTERNAL_SIZE_T);
-  assert (nclears >= 3);
-
-  if (nclears > 9)
-    return memset (d, 0, clearsize);
-
-  else
-    {
-      *(d + 0) = 0;
-      *(d + 1) = 0;
-      *(d + 2) = 0;
-      if (nclears > 4)
-        {
-          *(d + 3) = 0;
-          *(d + 4) = 0;
-          if (nclears > 6)
-            {
-              *(d + 5) = 0;
-              *(d + 6) = 0;
-              if (nclears > 8)
-                {
-                  *(d + 7) = 0;
-                  *(d + 8) = 0;
-                }
-            }
-        }
-    }
-
-  return mem;
+  return clear_memory ((INTERNAL_SIZE_T *) mem, clearsize);
 }
 #endif /* IS_IN (libc) */
 
```
