1 1.1 christos #ifndef JEMALLOC_INTERNAL_SIZE_H 2 1.1 christos #define JEMALLOC_INTERNAL_SIZE_H 3 1.1 christos 4 1.1 christos #include "jemalloc/internal/bit_util.h" 5 1.1 christos #include "jemalloc/internal/pages.h" 6 1.1.1.2 christos #include "jemalloc/internal/sc.h" 7 1.1 christos #include "jemalloc/internal/util.h" 8 1.1 christos 9 1.1 christos /* 10 1.1 christos * sz module: Size computations. 11 1.1 christos * 12 1.1 christos * Some abbreviations used here: 13 1.1 christos * p: Page 14 1.1 christos * ind: Index 15 1.1 christos * s, sz: Size 16 1.1 christos * u: Usable size 17 1.1 christos * a: Aligned 18 1.1 christos * 19 1.1 christos * These are not always used completely consistently, but should be enough to 20 1.1 christos * interpret function names. E.g. sz_psz2ind converts page size to page size 21 1.1 christos * index; sz_sa2u converts a (size, alignment) allocation request to the usable 22 1.1 christos * size that would result from such an allocation. 23 1.1 christos */ 24 1.1 christos 25 1.1.1.2 christos /* Page size index type. */ 26 1.1.1.2 christos typedef unsigned pszind_t; 27 1.1.1.2 christos 28 1.1.1.2 christos /* Size class index type. */ 29 1.1.1.2 christos typedef unsigned szind_t; 30 1.1.1.2 christos 31 1.1 christos /* 32 1.1 christos * sz_pind2sz_tab encodes the same information as could be computed by 33 1.1 christos * sz_pind2sz_compute(). 34 1.1 christos */ 35 1.1.1.2 christos extern size_t sz_pind2sz_tab[SC_NPSIZES + 1]; 36 1.1 christos /* 37 1.1 christos * sz_index2size_tab encodes the same information as could be computed (at 38 1.1 christos * unacceptable cost in some code paths) by sz_index2size_compute(). 39 1.1 christos */ 40 1.1.1.2 christos extern size_t sz_index2size_tab[SC_NSIZES]; 41 1.1 christos /* 42 1.1 christos * sz_size2index_tab is a compact lookup table that rounds request sizes up to 43 1.1 christos * size classes. In order to reduce cache footprint, the table is compressed, 44 1.1 christos * and all accesses are via sz_size2index(). 45 1.1 christos */ 46 1.1.1.2 christos extern uint8_t sz_size2index_tab[]; 47 1.1 christos 48 1.1.1.2 christos /* 49 1.1.1.2 christos * Padding for large allocations: PAGE when opt_cache_oblivious == true (to 50 1.1.1.2 christos * enable cache index randomization); 0 otherwise. 51 1.1.1.2 christos */ 52 1.1.1.2 christos extern size_t sz_large_pad; 53 1.1.1.2 christos 54 1.1.1.2 christos extern void sz_boot(const sc_data_t *sc_data, bool cache_oblivious); 55 1.1 christos 56 1.1 christos JEMALLOC_ALWAYS_INLINE pszind_t 57 1.1 christos sz_psz2ind(size_t psz) { 58 1.1.1.2 christos assert(psz > 0); 59 1.1.1.2 christos if (unlikely(psz > SC_LARGE_MAXCLASS)) { 60 1.1.1.2 christos return SC_NPSIZES; 61 1.1 christos } 62 1.1.1.2 christos /* x is the lg of the first base >= psz. */ 63 1.1.1.2 christos pszind_t x = lg_ceil(psz); 64 1.1.1.2 christos /* 65 1.1.1.2 christos * sc.h introduces a lot of size classes. These size classes are divided 66 1.1.1.2 christos * into different size class groups. There is a very special size class 67 1.1.1.2 christos * group, each size class in or after it is an integer multiple of PAGE. 68 1.1.1.2 christos * We call it first_ps_rg. It means first page size regular group. The 69 1.1.1.2 christos * range of first_ps_rg is (base, base * 2], and base == PAGE * 70 1.1.1.2 christos * SC_NGROUP. off_to_first_ps_rg begins from 1, instead of 0. e.g. 71 1.1.1.2 christos * off_to_first_ps_rg is 1 when psz is (PAGE * SC_NGROUP + 1). 72 1.1.1.2 christos */ 73 1.1.1.2 christos pszind_t off_to_first_ps_rg = (x < SC_LG_NGROUP + LG_PAGE) ? 74 1.1.1.2 christos 0 : x - (SC_LG_NGROUP + LG_PAGE); 75 1.1 christos 76 1.1.1.2 christos /* 77 1.1.1.2 christos * Same as sc_s::lg_delta. 78 1.1.1.2 christos * Delta for off_to_first_ps_rg == 1 is PAGE, 79 1.1.1.2 christos * for each increase in offset, it's multiplied by two. 80 1.1.1.2 christos * Therefore, lg_delta = LG_PAGE + (off_to_first_ps_rg - 1). 81 1.1.1.2 christos */ 82 1.1.1.2 christos pszind_t lg_delta = (off_to_first_ps_rg == 0) ? 83 1.1.1.2 christos LG_PAGE : LG_PAGE + (off_to_first_ps_rg - 1); 84 1.1 christos 85 1.1.1.2 christos /* 86 1.1.1.2 christos * Let's write psz in binary, e.g. 0011 for 0x3, 0111 for 0x7. 87 1.1.1.2 christos * The leftmost bits whose len is lg_base decide the base of psz. 88 1.1.1.2 christos * The rightmost bits whose len is lg_delta decide (pgz % PAGE). 89 1.1.1.2 christos * The middle bits whose len is SC_LG_NGROUP decide ndelta. 90 1.1.1.2 christos * ndelta is offset to the first size class in the size class group, 91 1.1.1.2 christos * starts from 1. 92 1.1.1.2 christos * If you don't know lg_base, ndelta or lg_delta, see sc.h. 93 1.1.1.2 christos * |xxxxxxxxxxxxxxxxxxxx|------------------------|yyyyyyyyyyyyyyyyyyyyy| 94 1.1.1.2 christos * |<-- len: lg_base -->|<-- len: SC_LG_NGROUP-->|<-- len: lg_delta -->| 95 1.1.1.2 christos * |<-- ndelta -->| 96 1.1.1.2 christos * rg_inner_off = ndelta - 1 97 1.1.1.2 christos * Why use (psz - 1)? 98 1.1.1.2 christos * To handle case: psz % (1 << lg_delta) == 0. 99 1.1.1.2 christos */ 100 1.1.1.2 christos pszind_t rg_inner_off = (((psz - 1)) >> lg_delta) & (SC_NGROUP - 1); 101 1.1 christos 102 1.1.1.2 christos pszind_t base_ind = off_to_first_ps_rg << SC_LG_NGROUP; 103 1.1.1.2 christos pszind_t ind = base_ind + rg_inner_off; 104 1.1.1.2 christos return ind; 105 1.1 christos } 106 1.1 christos 107 1.1 christos static inline size_t 108 1.1 christos sz_pind2sz_compute(pszind_t pind) { 109 1.1.1.2 christos if (unlikely(pind == SC_NPSIZES)) { 110 1.1.1.2 christos return SC_LARGE_MAXCLASS + PAGE; 111 1.1 christos } 112 1.1.1.2 christos size_t grp = pind >> SC_LG_NGROUP; 113 1.1.1.2 christos size_t mod = pind & ((ZU(1) << SC_LG_NGROUP) - 1); 114 1.1 christos 115 1.1.1.2 christos size_t grp_size_mask = ~((!!grp)-1); 116 1.1.1.2 christos size_t grp_size = ((ZU(1) << (LG_PAGE + (SC_LG_NGROUP-1))) << grp) 117 1.1.1.2 christos & grp_size_mask; 118 1.1.1.2 christos 119 1.1.1.2 christos size_t shift = (grp == 0) ? 1 : grp; 120 1.1.1.2 christos size_t lg_delta = shift + (LG_PAGE-1); 121 1.1.1.2 christos size_t mod_size = (mod+1) << lg_delta; 122 1.1 christos 123 1.1.1.2 christos size_t sz = grp_size + mod_size; 124 1.1.1.2 christos return sz; 125 1.1 christos } 126 1.1 christos 127 1.1 christos static inline size_t 128 1.1 christos sz_pind2sz_lookup(pszind_t pind) { 129 1.1 christos size_t ret = (size_t)sz_pind2sz_tab[pind]; 130 1.1 christos assert(ret == sz_pind2sz_compute(pind)); 131 1.1 christos return ret; 132 1.1 christos } 133 1.1 christos 134 1.1 christos static inline size_t 135 1.1 christos sz_pind2sz(pszind_t pind) { 136 1.1.1.2 christos assert(pind < SC_NPSIZES + 1); 137 1.1 christos return sz_pind2sz_lookup(pind); 138 1.1 christos } 139 1.1 christos 140 1.1 christos static inline size_t 141 1.1 christos sz_psz2u(size_t psz) { 142 1.1.1.2 christos if (unlikely(psz > SC_LARGE_MAXCLASS)) { 143 1.1.1.2 christos return SC_LARGE_MAXCLASS + PAGE; 144 1.1 christos } 145 1.1.1.2 christos size_t x = lg_floor((psz<<1)-1); 146 1.1.1.2 christos size_t lg_delta = (x < SC_LG_NGROUP + LG_PAGE + 1) ? 147 1.1.1.2 christos LG_PAGE : x - SC_LG_NGROUP - 1; 148 1.1.1.2 christos size_t delta = ZU(1) << lg_delta; 149 1.1.1.2 christos size_t delta_mask = delta - 1; 150 1.1.1.2 christos size_t usize = (psz + delta_mask) & ~delta_mask; 151 1.1.1.2 christos return usize; 152 1.1 christos } 153 1.1 christos 154 1.1 christos static inline szind_t 155 1.1 christos sz_size2index_compute(size_t size) { 156 1.1.1.2 christos if (unlikely(size > SC_LARGE_MAXCLASS)) { 157 1.1.1.2 christos return SC_NSIZES; 158 1.1 christos } 159 1.1.1.2 christos 160 1.1.1.2 christos if (size == 0) { 161 1.1.1.2 christos return 0; 162 1.1.1.2 christos } 163 1.1.1.2 christos #if (SC_NTINY != 0) 164 1.1.1.2 christos if (size <= (ZU(1) << SC_LG_TINY_MAXCLASS)) { 165 1.1.1.2 christos szind_t lg_tmin = SC_LG_TINY_MAXCLASS - SC_NTINY + 1; 166 1.1 christos szind_t lg_ceil = lg_floor(pow2_ceil_zu(size)); 167 1.1 christos return (lg_ceil < lg_tmin ? 0 : lg_ceil - lg_tmin); 168 1.1 christos } 169 1.1 christos #endif 170 1.1 christos { 171 1.1 christos szind_t x = lg_floor((size<<1)-1); 172 1.1.1.2 christos szind_t shift = (x < SC_LG_NGROUP + LG_QUANTUM) ? 0 : 173 1.1.1.2 christos x - (SC_LG_NGROUP + LG_QUANTUM); 174 1.1.1.2 christos szind_t grp = shift << SC_LG_NGROUP; 175 1.1 christos 176 1.1.1.2 christos szind_t lg_delta = (x < SC_LG_NGROUP + LG_QUANTUM + 1) 177 1.1.1.2 christos ? LG_QUANTUM : x - SC_LG_NGROUP - 1; 178 1.1 christos 179 1.1 christos size_t delta_inverse_mask = ZU(-1) << lg_delta; 180 1.1 christos szind_t mod = ((((size-1) & delta_inverse_mask) >> lg_delta)) & 181 1.1.1.2 christos ((ZU(1) << SC_LG_NGROUP) - 1); 182 1.1 christos 183 1.1.1.2 christos szind_t index = SC_NTINY + grp + mod; 184 1.1 christos return index; 185 1.1 christos } 186 1.1 christos } 187 1.1 christos 188 1.1 christos JEMALLOC_ALWAYS_INLINE szind_t 189 1.1.1.2 christos sz_size2index_lookup_impl(size_t size) { 190 1.1.1.2 christos assert(size <= SC_LOOKUP_MAXCLASS); 191 1.1.1.2 christos return sz_size2index_tab[(size + (ZU(1) << SC_LG_TINY_MIN) - 1) 192 1.1.1.2 christos >> SC_LG_TINY_MIN]; 193 1.1.1.2 christos } 194 1.1.1.2 christos 195 1.1.1.2 christos JEMALLOC_ALWAYS_INLINE szind_t 196 1.1 christos sz_size2index_lookup(size_t size) { 197 1.1.1.2 christos szind_t ret = sz_size2index_lookup_impl(size); 198 1.1.1.2 christos assert(ret == sz_size2index_compute(size)); 199 1.1.1.2 christos return ret; 200 1.1 christos } 201 1.1 christos 202 1.1 christos JEMALLOC_ALWAYS_INLINE szind_t 203 1.1 christos sz_size2index(size_t size) { 204 1.1.1.2 christos if (likely(size <= SC_LOOKUP_MAXCLASS)) { 205 1.1 christos return sz_size2index_lookup(size); 206 1.1 christos } 207 1.1 christos return sz_size2index_compute(size); 208 1.1 christos } 209 1.1 christos 210 1.1 christos static inline size_t 211 1.1 christos sz_index2size_compute(szind_t index) { 212 1.1.1.2 christos #if (SC_NTINY > 0) 213 1.1.1.2 christos if (index < SC_NTINY) { 214 1.1.1.2 christos return (ZU(1) << (SC_LG_TINY_MAXCLASS - SC_NTINY + 1 + index)); 215 1.1 christos } 216 1.1 christos #endif 217 1.1 christos { 218 1.1.1.2 christos size_t reduced_index = index - SC_NTINY; 219 1.1.1.2 christos size_t grp = reduced_index >> SC_LG_NGROUP; 220 1.1.1.2 christos size_t mod = reduced_index & ((ZU(1) << SC_LG_NGROUP) - 221 1.1 christos 1); 222 1.1 christos 223 1.1 christos size_t grp_size_mask = ~((!!grp)-1); 224 1.1 christos size_t grp_size = ((ZU(1) << (LG_QUANTUM + 225 1.1.1.2 christos (SC_LG_NGROUP-1))) << grp) & grp_size_mask; 226 1.1 christos 227 1.1 christos size_t shift = (grp == 0) ? 1 : grp; 228 1.1 christos size_t lg_delta = shift + (LG_QUANTUM-1); 229 1.1 christos size_t mod_size = (mod+1) << lg_delta; 230 1.1 christos 231 1.1 christos size_t usize = grp_size + mod_size; 232 1.1 christos return usize; 233 1.1 christos } 234 1.1 christos } 235 1.1 christos 236 1.1 christos JEMALLOC_ALWAYS_INLINE size_t 237 1.1.1.2 christos sz_index2size_lookup_impl(szind_t index) { 238 1.1.1.2 christos return sz_index2size_tab[index]; 239 1.1.1.2 christos } 240 1.1.1.2 christos 241 1.1.1.2 christos JEMALLOC_ALWAYS_INLINE size_t 242 1.1 christos sz_index2size_lookup(szind_t index) { 243 1.1.1.2 christos size_t ret = sz_index2size_lookup_impl(index); 244 1.1 christos assert(ret == sz_index2size_compute(index)); 245 1.1 christos return ret; 246 1.1 christos } 247 1.1 christos 248 1.1 christos JEMALLOC_ALWAYS_INLINE size_t 249 1.1 christos sz_index2size(szind_t index) { 250 1.1.1.2 christos assert(index < SC_NSIZES); 251 1.1 christos return sz_index2size_lookup(index); 252 1.1 christos } 253 1.1 christos 254 1.1.1.2 christos JEMALLOC_ALWAYS_INLINE void 255 1.1.1.2 christos sz_size2index_usize_fastpath(size_t size, szind_t *ind, size_t *usize) { 256 1.1.1.2 christos *ind = sz_size2index_lookup_impl(size); 257 1.1.1.2 christos *usize = sz_index2size_lookup_impl(*ind); 258 1.1.1.2 christos } 259 1.1.1.2 christos 260 1.1 christos JEMALLOC_ALWAYS_INLINE size_t 261 1.1 christos sz_s2u_compute(size_t size) { 262 1.1.1.2 christos if (unlikely(size > SC_LARGE_MAXCLASS)) { 263 1.1 christos return 0; 264 1.1 christos } 265 1.1.1.2 christos 266 1.1.1.2 christos if (size == 0) { 267 1.1.1.2 christos size++; 268 1.1.1.2 christos } 269 1.1.1.2 christos #if (SC_NTINY > 0) 270 1.1.1.2 christos if (size <= (ZU(1) << SC_LG_TINY_MAXCLASS)) { 271 1.1.1.2 christos size_t lg_tmin = SC_LG_TINY_MAXCLASS - SC_NTINY + 1; 272 1.1 christos size_t lg_ceil = lg_floor(pow2_ceil_zu(size)); 273 1.1 christos return (lg_ceil < lg_tmin ? (ZU(1) << lg_tmin) : 274 1.1 christos (ZU(1) << lg_ceil)); 275 1.1 christos } 276 1.1 christos #endif 277 1.1 christos { 278 1.1 christos size_t x = lg_floor((size<<1)-1); 279 1.1.1.2 christos size_t lg_delta = (x < SC_LG_NGROUP + LG_QUANTUM + 1) 280 1.1.1.2 christos ? LG_QUANTUM : x - SC_LG_NGROUP - 1; 281 1.1 christos size_t delta = ZU(1) << lg_delta; 282 1.1 christos size_t delta_mask = delta - 1; 283 1.1 christos size_t usize = (size + delta_mask) & ~delta_mask; 284 1.1 christos return usize; 285 1.1 christos } 286 1.1 christos } 287 1.1 christos 288 1.1 christos JEMALLOC_ALWAYS_INLINE size_t 289 1.1 christos sz_s2u_lookup(size_t size) { 290 1.1 christos size_t ret = sz_index2size_lookup(sz_size2index_lookup(size)); 291 1.1 christos 292 1.1 christos assert(ret == sz_s2u_compute(size)); 293 1.1 christos return ret; 294 1.1 christos } 295 1.1 christos 296 1.1 christos /* 297 1.1 christos * Compute usable size that would result from allocating an object with the 298 1.1 christos * specified size. 299 1.1 christos */ 300 1.1 christos JEMALLOC_ALWAYS_INLINE size_t 301 1.1 christos sz_s2u(size_t size) { 302 1.1.1.2 christos if (likely(size <= SC_LOOKUP_MAXCLASS)) { 303 1.1 christos return sz_s2u_lookup(size); 304 1.1 christos } 305 1.1 christos return sz_s2u_compute(size); 306 1.1 christos } 307 1.1 christos 308 1.1 christos /* 309 1.1 christos * Compute usable size that would result from allocating an object with the 310 1.1 christos * specified size and alignment. 311 1.1 christos */ 312 1.1 christos JEMALLOC_ALWAYS_INLINE size_t 313 1.1 christos sz_sa2u(size_t size, size_t alignment) { 314 1.1 christos size_t usize; 315 1.1 christos 316 1.1 christos assert(alignment != 0 && ((alignment - 1) & alignment) == 0); 317 1.1 christos 318 1.1 christos /* Try for a small size class. */ 319 1.1.1.2 christos if (size <= SC_SMALL_MAXCLASS && alignment <= PAGE) { 320 1.1 christos /* 321 1.1 christos * Round size up to the nearest multiple of alignment. 322 1.1 christos * 323 1.1 christos * This done, we can take advantage of the fact that for each 324 1.1 christos * small size class, every object is aligned at the smallest 325 1.1 christos * power of two that is non-zero in the base two representation 326 1.1 christos * of the size. For example: 327 1.1 christos * 328 1.1 christos * Size | Base 2 | Minimum alignment 329 1.1 christos * -----+----------+------------------ 330 1.1 christos * 96 | 1100000 | 32 331 1.1 christos * 144 | 10100000 | 32 332 1.1 christos * 192 | 11000000 | 64 333 1.1 christos */ 334 1.1 christos usize = sz_s2u(ALIGNMENT_CEILING(size, alignment)); 335 1.1.1.2 christos if (usize < SC_LARGE_MINCLASS) { 336 1.1 christos return usize; 337 1.1 christos } 338 1.1 christos } 339 1.1 christos 340 1.1 christos /* Large size class. Beware of overflow. */ 341 1.1 christos 342 1.1.1.2 christos if (unlikely(alignment > SC_LARGE_MAXCLASS)) { 343 1.1 christos return 0; 344 1.1 christos } 345 1.1 christos 346 1.1 christos /* Make sure result is a large size class. */ 347 1.1.1.2 christos if (size <= SC_LARGE_MINCLASS) { 348 1.1.1.2 christos usize = SC_LARGE_MINCLASS; 349 1.1 christos } else { 350 1.1 christos usize = sz_s2u(size); 351 1.1 christos if (usize < size) { 352 1.1 christos /* size_t overflow. */ 353 1.1 christos return 0; 354 1.1 christos } 355 1.1 christos } 356 1.1 christos 357 1.1 christos /* 358 1.1 christos * Calculate the multi-page mapping that large_palloc() would need in 359 1.1 christos * order to guarantee the alignment. 360 1.1 christos */ 361 1.1 christos if (usize + sz_large_pad + PAGE_CEILING(alignment) - PAGE < usize) { 362 1.1 christos /* size_t overflow. */ 363 1.1 christos return 0; 364 1.1 christos } 365 1.1 christos return usize; 366 1.1 christos } 367 1.1 christos 368 1.1.1.2 christos size_t sz_psz_quantize_floor(size_t size); 369 1.1.1.2 christos size_t sz_psz_quantize_ceil(size_t size); 370 1.1.1.2 christos 371 1.1 christos #endif /* JEMALLOC_INTERNAL_SIZE_H */ 372