Home | History | Annotate | Line # | Download | only in internal
      1      1.1  christos #ifndef JEMALLOC_INTERNAL_SIZE_H
      2      1.1  christos #define JEMALLOC_INTERNAL_SIZE_H
      3      1.1  christos 
      4      1.1  christos #include "jemalloc/internal/bit_util.h"
      5      1.1  christos #include "jemalloc/internal/pages.h"
      6  1.1.1.2  christos #include "jemalloc/internal/sc.h"
      7      1.1  christos #include "jemalloc/internal/util.h"
      8      1.1  christos 
      9      1.1  christos /*
     10      1.1  christos  * sz module: Size computations.
     11      1.1  christos  *
     12      1.1  christos  * Some abbreviations used here:
     13      1.1  christos  *   p: Page
     14      1.1  christos  *   ind: Index
     15      1.1  christos  *   s, sz: Size
     16      1.1  christos  *   u: Usable size
     17      1.1  christos  *   a: Aligned
     18      1.1  christos  *
     19      1.1  christos  * These are not always used completely consistently, but should be enough to
     20      1.1  christos  * interpret function names.  E.g. sz_psz2ind converts page size to page size
     21      1.1  christos  * index; sz_sa2u converts a (size, alignment) allocation request to the usable
     22      1.1  christos  * size that would result from such an allocation.
     23      1.1  christos  */
     24      1.1  christos 
     25  1.1.1.2  christos /* Page size index type. */
     26  1.1.1.2  christos typedef unsigned pszind_t;
     27  1.1.1.2  christos 
     28  1.1.1.2  christos /* Size class index type. */
     29  1.1.1.2  christos typedef unsigned szind_t;
     30  1.1.1.2  christos 
     31      1.1  christos /*
     32      1.1  christos  * sz_pind2sz_tab encodes the same information as could be computed by
     33      1.1  christos  * sz_pind2sz_compute().
     34      1.1  christos  */
     35  1.1.1.2  christos extern size_t sz_pind2sz_tab[SC_NPSIZES + 1];
     36      1.1  christos /*
     37      1.1  christos  * sz_index2size_tab encodes the same information as could be computed (at
     38      1.1  christos  * unacceptable cost in some code paths) by sz_index2size_compute().
     39      1.1  christos  */
     40  1.1.1.2  christos extern size_t sz_index2size_tab[SC_NSIZES];
     41      1.1  christos /*
     42      1.1  christos  * sz_size2index_tab is a compact lookup table that rounds request sizes up to
     43      1.1  christos  * size classes.  In order to reduce cache footprint, the table is compressed,
     44      1.1  christos  * and all accesses are via sz_size2index().
     45      1.1  christos  */
     46  1.1.1.2  christos extern uint8_t sz_size2index_tab[];
     47      1.1  christos 
     48  1.1.1.2  christos /*
     49  1.1.1.2  christos  * Padding for large allocations: PAGE when opt_cache_oblivious == true (to
     50  1.1.1.2  christos  * enable cache index randomization); 0 otherwise.
     51  1.1.1.2  christos  */
     52  1.1.1.2  christos extern size_t sz_large_pad;
     53  1.1.1.2  christos 
     54  1.1.1.2  christos extern void sz_boot(const sc_data_t *sc_data, bool cache_oblivious);
     55      1.1  christos 
     56      1.1  christos JEMALLOC_ALWAYS_INLINE pszind_t
     57      1.1  christos sz_psz2ind(size_t psz) {
     58  1.1.1.2  christos 	assert(psz > 0);
     59  1.1.1.2  christos 	if (unlikely(psz > SC_LARGE_MAXCLASS)) {
     60  1.1.1.2  christos 		return SC_NPSIZES;
     61      1.1  christos 	}
     62  1.1.1.2  christos 	/* x is the lg of the first base >= psz. */
     63  1.1.1.2  christos 	pszind_t x = lg_ceil(psz);
     64  1.1.1.2  christos 	/*
     65  1.1.1.2  christos 	 * sc.h introduces a lot of size classes. These size classes are divided
     66  1.1.1.2  christos 	 * into different size class groups. There is a very special size class
     67  1.1.1.2  christos 	 * group, each size class in or after it is an integer multiple of PAGE.
     68  1.1.1.2  christos 	 * We call it first_ps_rg. It means first page size regular group. The
     69  1.1.1.2  christos 	 * range of first_ps_rg is (base, base * 2], and base == PAGE *
     70  1.1.1.2  christos 	 * SC_NGROUP. off_to_first_ps_rg begins from 1, instead of 0. e.g.
     71  1.1.1.2  christos 	 * off_to_first_ps_rg is 1 when psz is (PAGE * SC_NGROUP + 1).
     72  1.1.1.2  christos 	 */
     73  1.1.1.2  christos 	pszind_t off_to_first_ps_rg = (x < SC_LG_NGROUP + LG_PAGE) ?
     74  1.1.1.2  christos 	    0 : x - (SC_LG_NGROUP + LG_PAGE);
     75      1.1  christos 
     76  1.1.1.2  christos 	/*
     77  1.1.1.2  christos 	 * Same as sc_s::lg_delta.
     78  1.1.1.2  christos 	 * Delta for off_to_first_ps_rg == 1 is PAGE,
     79  1.1.1.2  christos 	 * for each increase in offset, it's multiplied by two.
     80  1.1.1.2  christos 	 * Therefore, lg_delta = LG_PAGE + (off_to_first_ps_rg - 1).
     81  1.1.1.2  christos 	 */
     82  1.1.1.2  christos 	pszind_t lg_delta = (off_to_first_ps_rg == 0) ?
     83  1.1.1.2  christos 	    LG_PAGE : LG_PAGE + (off_to_first_ps_rg - 1);
     84      1.1  christos 
     85  1.1.1.2  christos 	/*
     86  1.1.1.2  christos 	 * Let's write psz in binary, e.g. 0011 for 0x3, 0111 for 0x7.
     87  1.1.1.2  christos 	 * The leftmost bits whose len is lg_base decide the base of psz.
     88  1.1.1.2  christos 	 * The rightmost bits whose len is lg_delta decide (pgz % PAGE).
     89  1.1.1.2  christos 	 * The middle bits whose len is SC_LG_NGROUP decide ndelta.
     90  1.1.1.2  christos 	 * ndelta is offset to the first size class in the size class group,
     91  1.1.1.2  christos 	 * starts from 1.
     92  1.1.1.2  christos 	 * If you don't know lg_base, ndelta or lg_delta, see sc.h.
     93  1.1.1.2  christos 	 * |xxxxxxxxxxxxxxxxxxxx|------------------------|yyyyyyyyyyyyyyyyyyyyy|
     94  1.1.1.2  christos 	 * |<-- len: lg_base -->|<-- len: SC_LG_NGROUP-->|<-- len: lg_delta -->|
     95  1.1.1.2  christos 	 *                      |<--      ndelta      -->|
     96  1.1.1.2  christos 	 * rg_inner_off = ndelta - 1
     97  1.1.1.2  christos 	 * Why use (psz - 1)?
     98  1.1.1.2  christos 	 * To handle case: psz % (1 << lg_delta) == 0.
     99  1.1.1.2  christos 	 */
    100  1.1.1.2  christos 	pszind_t rg_inner_off = (((psz - 1)) >> lg_delta) & (SC_NGROUP - 1);
    101      1.1  christos 
    102  1.1.1.2  christos 	pszind_t base_ind = off_to_first_ps_rg << SC_LG_NGROUP;
    103  1.1.1.2  christos 	pszind_t ind = base_ind + rg_inner_off;
    104  1.1.1.2  christos 	return ind;
    105      1.1  christos }
    106      1.1  christos 
    107      1.1  christos static inline size_t
    108      1.1  christos sz_pind2sz_compute(pszind_t pind) {
    109  1.1.1.2  christos 	if (unlikely(pind == SC_NPSIZES)) {
    110  1.1.1.2  christos 		return SC_LARGE_MAXCLASS + PAGE;
    111      1.1  christos 	}
    112  1.1.1.2  christos 	size_t grp = pind >> SC_LG_NGROUP;
    113  1.1.1.2  christos 	size_t mod = pind & ((ZU(1) << SC_LG_NGROUP) - 1);
    114      1.1  christos 
    115  1.1.1.2  christos 	size_t grp_size_mask = ~((!!grp)-1);
    116  1.1.1.2  christos 	size_t grp_size = ((ZU(1) << (LG_PAGE + (SC_LG_NGROUP-1))) << grp)
    117  1.1.1.2  christos 	    & grp_size_mask;
    118  1.1.1.2  christos 
    119  1.1.1.2  christos 	size_t shift = (grp == 0) ? 1 : grp;
    120  1.1.1.2  christos 	size_t lg_delta = shift + (LG_PAGE-1);
    121  1.1.1.2  christos 	size_t mod_size = (mod+1) << lg_delta;
    122      1.1  christos 
    123  1.1.1.2  christos 	size_t sz = grp_size + mod_size;
    124  1.1.1.2  christos 	return sz;
    125      1.1  christos }
    126      1.1  christos 
    127      1.1  christos static inline size_t
    128      1.1  christos sz_pind2sz_lookup(pszind_t pind) {
    129      1.1  christos 	size_t ret = (size_t)sz_pind2sz_tab[pind];
    130      1.1  christos 	assert(ret == sz_pind2sz_compute(pind));
    131      1.1  christos 	return ret;
    132      1.1  christos }
    133      1.1  christos 
    134      1.1  christos static inline size_t
    135      1.1  christos sz_pind2sz(pszind_t pind) {
    136  1.1.1.2  christos 	assert(pind < SC_NPSIZES + 1);
    137      1.1  christos 	return sz_pind2sz_lookup(pind);
    138      1.1  christos }
    139      1.1  christos 
    140      1.1  christos static inline size_t
    141      1.1  christos sz_psz2u(size_t psz) {
    142  1.1.1.2  christos 	if (unlikely(psz > SC_LARGE_MAXCLASS)) {
    143  1.1.1.2  christos 		return SC_LARGE_MAXCLASS + PAGE;
    144      1.1  christos 	}
    145  1.1.1.2  christos 	size_t x = lg_floor((psz<<1)-1);
    146  1.1.1.2  christos 	size_t lg_delta = (x < SC_LG_NGROUP + LG_PAGE + 1) ?
    147  1.1.1.2  christos 	    LG_PAGE : x - SC_LG_NGROUP - 1;
    148  1.1.1.2  christos 	size_t delta = ZU(1) << lg_delta;
    149  1.1.1.2  christos 	size_t delta_mask = delta - 1;
    150  1.1.1.2  christos 	size_t usize = (psz + delta_mask) & ~delta_mask;
    151  1.1.1.2  christos 	return usize;
    152      1.1  christos }
    153      1.1  christos 
    154      1.1  christos static inline szind_t
    155      1.1  christos sz_size2index_compute(size_t size) {
    156  1.1.1.2  christos 	if (unlikely(size > SC_LARGE_MAXCLASS)) {
    157  1.1.1.2  christos 		return SC_NSIZES;
    158      1.1  christos 	}
    159  1.1.1.2  christos 
    160  1.1.1.2  christos 	if (size == 0) {
    161  1.1.1.2  christos 		return 0;
    162  1.1.1.2  christos 	}
    163  1.1.1.2  christos #if (SC_NTINY != 0)
    164  1.1.1.2  christos 	if (size <= (ZU(1) << SC_LG_TINY_MAXCLASS)) {
    165  1.1.1.2  christos 		szind_t lg_tmin = SC_LG_TINY_MAXCLASS - SC_NTINY + 1;
    166      1.1  christos 		szind_t lg_ceil = lg_floor(pow2_ceil_zu(size));
    167      1.1  christos 		return (lg_ceil < lg_tmin ? 0 : lg_ceil - lg_tmin);
    168      1.1  christos 	}
    169      1.1  christos #endif
    170      1.1  christos 	{
    171      1.1  christos 		szind_t x = lg_floor((size<<1)-1);
    172  1.1.1.2  christos 		szind_t shift = (x < SC_LG_NGROUP + LG_QUANTUM) ? 0 :
    173  1.1.1.2  christos 		    x - (SC_LG_NGROUP + LG_QUANTUM);
    174  1.1.1.2  christos 		szind_t grp = shift << SC_LG_NGROUP;
    175      1.1  christos 
    176  1.1.1.2  christos 		szind_t lg_delta = (x < SC_LG_NGROUP + LG_QUANTUM + 1)
    177  1.1.1.2  christos 		    ? LG_QUANTUM : x - SC_LG_NGROUP - 1;
    178      1.1  christos 
    179      1.1  christos 		size_t delta_inverse_mask = ZU(-1) << lg_delta;
    180      1.1  christos 		szind_t mod = ((((size-1) & delta_inverse_mask) >> lg_delta)) &
    181  1.1.1.2  christos 		    ((ZU(1) << SC_LG_NGROUP) - 1);
    182      1.1  christos 
    183  1.1.1.2  christos 		szind_t index = SC_NTINY + grp + mod;
    184      1.1  christos 		return index;
    185      1.1  christos 	}
    186      1.1  christos }
    187      1.1  christos 
    188      1.1  christos JEMALLOC_ALWAYS_INLINE szind_t
    189  1.1.1.2  christos sz_size2index_lookup_impl(size_t size) {
    190  1.1.1.2  christos 	assert(size <= SC_LOOKUP_MAXCLASS);
    191  1.1.1.2  christos 	return sz_size2index_tab[(size + (ZU(1) << SC_LG_TINY_MIN) - 1)
    192  1.1.1.2  christos 	    >> SC_LG_TINY_MIN];
    193  1.1.1.2  christos }
    194  1.1.1.2  christos 
    195  1.1.1.2  christos JEMALLOC_ALWAYS_INLINE szind_t
    196      1.1  christos sz_size2index_lookup(size_t size) {
    197  1.1.1.2  christos 	szind_t ret = sz_size2index_lookup_impl(size);
    198  1.1.1.2  christos 	assert(ret == sz_size2index_compute(size));
    199  1.1.1.2  christos 	return ret;
    200      1.1  christos }
    201      1.1  christos 
    202      1.1  christos JEMALLOC_ALWAYS_INLINE szind_t
    203      1.1  christos sz_size2index(size_t size) {
    204  1.1.1.2  christos 	if (likely(size <= SC_LOOKUP_MAXCLASS)) {
    205      1.1  christos 		return sz_size2index_lookup(size);
    206      1.1  christos 	}
    207      1.1  christos 	return sz_size2index_compute(size);
    208      1.1  christos }
    209      1.1  christos 
    210      1.1  christos static inline size_t
    211      1.1  christos sz_index2size_compute(szind_t index) {
    212  1.1.1.2  christos #if (SC_NTINY > 0)
    213  1.1.1.2  christos 	if (index < SC_NTINY) {
    214  1.1.1.2  christos 		return (ZU(1) << (SC_LG_TINY_MAXCLASS - SC_NTINY + 1 + index));
    215      1.1  christos 	}
    216      1.1  christos #endif
    217      1.1  christos 	{
    218  1.1.1.2  christos 		size_t reduced_index = index - SC_NTINY;
    219  1.1.1.2  christos 		size_t grp = reduced_index >> SC_LG_NGROUP;
    220  1.1.1.2  christos 		size_t mod = reduced_index & ((ZU(1) << SC_LG_NGROUP) -
    221      1.1  christos 		    1);
    222      1.1  christos 
    223      1.1  christos 		size_t grp_size_mask = ~((!!grp)-1);
    224      1.1  christos 		size_t grp_size = ((ZU(1) << (LG_QUANTUM +
    225  1.1.1.2  christos 		    (SC_LG_NGROUP-1))) << grp) & grp_size_mask;
    226      1.1  christos 
    227      1.1  christos 		size_t shift = (grp == 0) ? 1 : grp;
    228      1.1  christos 		size_t lg_delta = shift + (LG_QUANTUM-1);
    229      1.1  christos 		size_t mod_size = (mod+1) << lg_delta;
    230      1.1  christos 
    231      1.1  christos 		size_t usize = grp_size + mod_size;
    232      1.1  christos 		return usize;
    233      1.1  christos 	}
    234      1.1  christos }
    235      1.1  christos 
    236      1.1  christos JEMALLOC_ALWAYS_INLINE size_t
    237  1.1.1.2  christos sz_index2size_lookup_impl(szind_t index) {
    238  1.1.1.2  christos 	return sz_index2size_tab[index];
    239  1.1.1.2  christos }
    240  1.1.1.2  christos 
    241  1.1.1.2  christos JEMALLOC_ALWAYS_INLINE size_t
    242      1.1  christos sz_index2size_lookup(szind_t index) {
    243  1.1.1.2  christos 	size_t ret = sz_index2size_lookup_impl(index);
    244      1.1  christos 	assert(ret == sz_index2size_compute(index));
    245      1.1  christos 	return ret;
    246      1.1  christos }
    247      1.1  christos 
    248      1.1  christos JEMALLOC_ALWAYS_INLINE size_t
    249      1.1  christos sz_index2size(szind_t index) {
    250  1.1.1.2  christos 	assert(index < SC_NSIZES);
    251      1.1  christos 	return sz_index2size_lookup(index);
    252      1.1  christos }
    253      1.1  christos 
    254  1.1.1.2  christos JEMALLOC_ALWAYS_INLINE void
    255  1.1.1.2  christos sz_size2index_usize_fastpath(size_t size, szind_t *ind, size_t *usize) {
    256  1.1.1.2  christos 	*ind = sz_size2index_lookup_impl(size);
    257  1.1.1.2  christos 	*usize = sz_index2size_lookup_impl(*ind);
    258  1.1.1.2  christos }
    259  1.1.1.2  christos 
    260      1.1  christos JEMALLOC_ALWAYS_INLINE size_t
    261      1.1  christos sz_s2u_compute(size_t size) {
    262  1.1.1.2  christos 	if (unlikely(size > SC_LARGE_MAXCLASS)) {
    263      1.1  christos 		return 0;
    264      1.1  christos 	}
    265  1.1.1.2  christos 
    266  1.1.1.2  christos 	if (size == 0) {
    267  1.1.1.2  christos 		size++;
    268  1.1.1.2  christos 	}
    269  1.1.1.2  christos #if (SC_NTINY > 0)
    270  1.1.1.2  christos 	if (size <= (ZU(1) << SC_LG_TINY_MAXCLASS)) {
    271  1.1.1.2  christos 		size_t lg_tmin = SC_LG_TINY_MAXCLASS - SC_NTINY + 1;
    272      1.1  christos 		size_t lg_ceil = lg_floor(pow2_ceil_zu(size));
    273      1.1  christos 		return (lg_ceil < lg_tmin ? (ZU(1) << lg_tmin) :
    274      1.1  christos 		    (ZU(1) << lg_ceil));
    275      1.1  christos 	}
    276      1.1  christos #endif
    277      1.1  christos 	{
    278      1.1  christos 		size_t x = lg_floor((size<<1)-1);
    279  1.1.1.2  christos 		size_t lg_delta = (x < SC_LG_NGROUP + LG_QUANTUM + 1)
    280  1.1.1.2  christos 		    ?  LG_QUANTUM : x - SC_LG_NGROUP - 1;
    281      1.1  christos 		size_t delta = ZU(1) << lg_delta;
    282      1.1  christos 		size_t delta_mask = delta - 1;
    283      1.1  christos 		size_t usize = (size + delta_mask) & ~delta_mask;
    284      1.1  christos 		return usize;
    285      1.1  christos 	}
    286      1.1  christos }
    287      1.1  christos 
    288      1.1  christos JEMALLOC_ALWAYS_INLINE size_t
    289      1.1  christos sz_s2u_lookup(size_t size) {
    290      1.1  christos 	size_t ret = sz_index2size_lookup(sz_size2index_lookup(size));
    291      1.1  christos 
    292      1.1  christos 	assert(ret == sz_s2u_compute(size));
    293      1.1  christos 	return ret;
    294      1.1  christos }
    295      1.1  christos 
    296      1.1  christos /*
    297      1.1  christos  * Compute usable size that would result from allocating an object with the
    298      1.1  christos  * specified size.
    299      1.1  christos  */
    300      1.1  christos JEMALLOC_ALWAYS_INLINE size_t
    301      1.1  christos sz_s2u(size_t size) {
    302  1.1.1.2  christos 	if (likely(size <= SC_LOOKUP_MAXCLASS)) {
    303      1.1  christos 		return sz_s2u_lookup(size);
    304      1.1  christos 	}
    305      1.1  christos 	return sz_s2u_compute(size);
    306      1.1  christos }
    307      1.1  christos 
    308      1.1  christos /*
    309      1.1  christos  * Compute usable size that would result from allocating an object with the
    310      1.1  christos  * specified size and alignment.
    311      1.1  christos  */
    312      1.1  christos JEMALLOC_ALWAYS_INLINE size_t
    313      1.1  christos sz_sa2u(size_t size, size_t alignment) {
    314      1.1  christos 	size_t usize;
    315      1.1  christos 
    316      1.1  christos 	assert(alignment != 0 && ((alignment - 1) & alignment) == 0);
    317      1.1  christos 
    318      1.1  christos 	/* Try for a small size class. */
    319  1.1.1.2  christos 	if (size <= SC_SMALL_MAXCLASS && alignment <= PAGE) {
    320      1.1  christos 		/*
    321      1.1  christos 		 * Round size up to the nearest multiple of alignment.
    322      1.1  christos 		 *
    323      1.1  christos 		 * This done, we can take advantage of the fact that for each
    324      1.1  christos 		 * small size class, every object is aligned at the smallest
    325      1.1  christos 		 * power of two that is non-zero in the base two representation
    326      1.1  christos 		 * of the size.  For example:
    327      1.1  christos 		 *
    328      1.1  christos 		 *   Size |   Base 2 | Minimum alignment
    329      1.1  christos 		 *   -----+----------+------------------
    330      1.1  christos 		 *     96 |  1100000 |  32
    331      1.1  christos 		 *    144 | 10100000 |  32
    332      1.1  christos 		 *    192 | 11000000 |  64
    333      1.1  christos 		 */
    334      1.1  christos 		usize = sz_s2u(ALIGNMENT_CEILING(size, alignment));
    335  1.1.1.2  christos 		if (usize < SC_LARGE_MINCLASS) {
    336      1.1  christos 			return usize;
    337      1.1  christos 		}
    338      1.1  christos 	}
    339      1.1  christos 
    340      1.1  christos 	/* Large size class.  Beware of overflow. */
    341      1.1  christos 
    342  1.1.1.2  christos 	if (unlikely(alignment > SC_LARGE_MAXCLASS)) {
    343      1.1  christos 		return 0;
    344      1.1  christos 	}
    345      1.1  christos 
    346      1.1  christos 	/* Make sure result is a large size class. */
    347  1.1.1.2  christos 	if (size <= SC_LARGE_MINCLASS) {
    348  1.1.1.2  christos 		usize = SC_LARGE_MINCLASS;
    349      1.1  christos 	} else {
    350      1.1  christos 		usize = sz_s2u(size);
    351      1.1  christos 		if (usize < size) {
    352      1.1  christos 			/* size_t overflow. */
    353      1.1  christos 			return 0;
    354      1.1  christos 		}
    355      1.1  christos 	}
    356      1.1  christos 
    357      1.1  christos 	/*
    358      1.1  christos 	 * Calculate the multi-page mapping that large_palloc() would need in
    359      1.1  christos 	 * order to guarantee the alignment.
    360      1.1  christos 	 */
    361      1.1  christos 	if (usize + sz_large_pad + PAGE_CEILING(alignment) - PAGE < usize) {
    362      1.1  christos 		/* size_t overflow. */
    363      1.1  christos 		return 0;
    364      1.1  christos 	}
    365      1.1  christos 	return usize;
    366      1.1  christos }
    367      1.1  christos 
    368  1.1.1.2  christos size_t sz_psz_quantize_floor(size_t size);
    369  1.1.1.2  christos size_t sz_psz_quantize_ceil(size_t size);
    370  1.1.1.2  christos 
    371      1.1  christos #endif /* JEMALLOC_INTERNAL_SIZE_H */
    372