slabmgr.h 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446
  1. /* -*- mode:c; c-file-style:"k&r"; c-basic-offset: 4; tab-width:4; indent-tabs-mode:nil; mode:auto-fill; fill-column:78; -*- */
  2. /* vim: set ts=4 sw=4 et tw=78 fo=cqt wm=0: */
  3. /* Copyright (C) 2014 OSCAR lab, Stony Brook University
  4. This file is part of Graphene Library OS.
  5. Graphene Library OS is free software: you can redistribute it and/or
  6. modify it under the terms of the GNU General Public License
  7. as published by the Free Software Foundation, either version 3 of the
  8. License, or (at your option) any later version.
  9. Graphene Library OS is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program. If not, see <http://www.gnu.org/licenses/>. */
  15. /*
  16. * slabmgr.h
  17. *
  18. * This file contains implementation of SLAB (variable-size) memory allocator.
  19. */
  20. #ifndef SLABMGR_H
  21. #define SLABMGR_H
  22. #include "linux_list.h"
  23. #include <assert.h>
  24. #include <sys/mman.h>
  25. #ifndef system_malloc
  26. #error "macro \"void * system_malloc(int size)\" not declared"
  27. #endif
  28. #ifndef system_free
  29. #error "macro \"void * system_free(void * ptr, int size)\" not declared"
  30. #endif
  31. #ifndef system_lock
  32. #define system_lock() ({})
  33. #endif
  34. #ifndef system_unlock
  35. #define system_unlock() ({})
  36. #endif
  37. /* malloc is supposed to provide some kind of alignment guarantees, but
  38. * I can't find a specific reference to what that should be for x86_64.
  39. * The first link here is a reference to a technical report from Mozilla,
  40. * which seems to indicate that 64-bit platforms align return values to
  41. * 16-bytes. calloc and malloc provide the same alignment guarantees.
  42. * calloc additionally sets the memory to 0, which malloc is not required
  43. * to do.
  44. *
  45. * http://www.erahm.org/2016/03/24/minimum-alignment-of-allocation-across-platforms/
  46. * http://pubs.opengroup.org/onlinepubs/9699919799/functions/malloc.html
  47. */
  48. #define MIN_MALLOC_ALIGNMENT 16
  49. /* Slab objects need to be a multiple of 16 bytes to ensure proper address
  50. * alignment for malloc and calloc. */
  51. #define OBJ_PADDING 15
  52. #define LARGE_OBJ_PADDING 8
  53. /* Returns the smallest exact multiple of _y that is at least as large as _x.
  54. * In other words, returns _x if _x is a multiple of _y, otherwise rounds
  55. * _x up to be a multiple of _y.
  56. */
  57. #define ROUND_UP(_x, _y) ((((_x) + (_y) - 1) / (_y)) * (_y))
  58. typedef struct __attribute__((packed)) slab_obj {
  59. unsigned char level;
  60. unsigned char padding[OBJ_PADDING];
  61. union {
  62. struct list_head __list;
  63. unsigned char *raw;
  64. };
  65. } SLAB_OBJ_TYPE, * SLAB_OBJ;
  66. /* In order for slab elements to be 16-byte aligned, struct slab_area must
  67. * be a multiple of 16 bytes. TODO: Add compile time assertion that this
  68. * invariant is respected. */
  69. #define AREA_PADDING 12
  70. typedef struct __attribute__((packed)) slab_area {
  71. struct list_head __list;
  72. unsigned int size;
  73. unsigned char pad[AREA_PADDING];
  74. unsigned char raw[];
  75. } SLAB_AREA_TYPE, * SLAB_AREA;
  76. #ifdef SLAB_DEBUG
  77. struct slab_debug {
  78. struct {
  79. const char * file;
  80. int line;
  81. } alloc, free;
  82. };
  83. # define SLAB_DEBUG_SIZE sizeof(struct slab_debug)
  84. #else
  85. # define SLAB_DEBUG_SIZE 0
  86. #endif
  87. #ifdef SLAB_CANARY
  88. # define SLAB_CANARY_STRING 0xDEADBEEF
  89. # define SLAB_CANARY_SIZE sizeof(unsigned long)
  90. #else
  91. # define SLAB_CANARY_SIZE 0
  92. #endif
  93. #define SLAB_HDR_SIZE \
  94. ROUND_UP((sizeof(SLAB_OBJ_TYPE) - sizeof(struct list_head) + \
  95. SLAB_DEBUG_SIZE + SLAB_CANARY_SIZE), \
  96. MIN_MALLOC_ALIGNMENT)
  97. #ifndef SLAB_LEVEL
  98. #define SLAB_LEVEL 8
  99. #endif
  100. #ifndef SLAB_LEVEL_SIZES
  101. # define SLAB_LEVEL_SIZES 16, 32, 64, \
  102. 128 - SLAB_HDR_SIZE, \
  103. 256 - SLAB_HDR_SIZE, \
  104. 512 - SLAB_HDR_SIZE, \
  105. 1024 - SLAB_HDR_SIZE, \
  106. 2048 - SLAB_HDR_SIZE
  107. # define SLAB_LEVELS_SUM (4080 - SLAB_HDR_SIZE * 5)
  108. #else
  109. # ifndef SLAB_LEVELS_SUM
  110. # error "SALB_LEVELS_SUM not defined"
  111. # endif
  112. #endif
  113. static int slab_levels[SLAB_LEVEL] = { SLAB_LEVEL_SIZES };
  114. typedef struct slab_mgr {
  115. struct list_head area_list[SLAB_LEVEL];
  116. struct list_head free_list[SLAB_LEVEL];
  117. unsigned int size[SLAB_LEVEL];
  118. void * addr[SLAB_LEVEL], * addr_top[SLAB_LEVEL];
  119. } SLAB_MGR_TYPE, * SLAB_MGR;
  120. typedef struct __attribute__((packed)) large_mem_obj {
  121. // offset 0
  122. unsigned long size;
  123. unsigned char large_padding[LARGE_OBJ_PADDING];
  124. // offset 16
  125. unsigned char level;
  126. unsigned char padding[OBJ_PADDING];
  127. // offset 32
  128. unsigned char raw[];
  129. } LARGE_MEM_OBJ_TYPE, * LARGE_MEM_OBJ;
  130. #define OBJ_LEVEL(obj) ((obj)->level)
  131. #define OBJ_RAW(obj) (&(obj)->raw)
  132. #define RAW_TO_LEVEL(raw_ptr) \
  133. (*((unsigned char *) (raw_ptr) - OBJ_PADDING - 1))
  134. #define RAW_TO_OBJ(raw_ptr, type) container_of((raw_ptr), type, raw)
  135. #define __SUM_OBJ_SIZE(slab_size, size) \
  136. (((slab_size) + SLAB_HDR_SIZE) * (size))
  137. #define __MIN_MEM_SIZE() (sizeof(SLAB_AREA_TYPE))
  138. #define __MAX_MEM_SIZE(slab_size, size) \
  139. (__MIN_MEM_SIZE() + __SUM_OBJ_SIZE((slab_size), (size)))
  140. #define __INIT_SUM_OBJ_SIZE(size) \
  141. ((SLAB_LEVELS_SUM + SLAB_HDR_SIZE * SLAB_LEVEL) * (size))
  142. #define __INIT_MIN_MEM_SIZE() \
  143. (sizeof(SLAB_MGR_TYPE) + sizeof(SLAB_AREA_TYPE) * SLAB_LEVEL)
  144. #define __INIT_MAX_MEM_SIZE(size) \
  145. (__INIT_MIN_MEM_SIZE() + __INIT_SUM_OBJ_SIZE((size)))
  146. #ifdef PAGE_SIZE
  147. static inline int size_align_down(int slab_size, int size)
  148. {
  149. int s = __MAX_MEM_SIZE(slab_size, size);
  150. int p = s - (s & ~(PAGE_SIZE - 1));
  151. int o = __SUM_OBJ_SIZE(slab_size, 1);
  152. return size - p / o - (p % o ? 1 : 0);
  153. }
  154. static inline int size_align_up(int slab_size, int size)
  155. {
  156. int s = __MAX_MEM_SIZE(slab_size, size);
  157. int p = ((s + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1)) - s;
  158. int o = __SUM_OBJ_SIZE(slab_size, 1);
  159. return size + p / o;
  160. }
  161. static inline int init_align_down(int size)
  162. {
  163. int s = __INIT_MAX_MEM_SIZE(size);
  164. int p = s - (s & ~(PAGE_SIZE - 1));
  165. int o = __INIT_SUM_OBJ_SIZE(1);
  166. return size - p /o - (p % o ? 1 : 0);
  167. }
  168. static inline int init_size_align_up(int size)
  169. {
  170. int s = __INIT_MAX_MEM_SIZE(size);
  171. int p = ((s + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1)) - s;
  172. int o = __INIT_SUM_OBJ_SIZE(1);
  173. return size + p / o;
  174. }
  175. #endif /* PAGE_SIZE */
  176. #ifndef STARTUP_SIZE
  177. # define STARTUP_SIZE 16
  178. #endif
  179. static inline void __set_free_slab_area (SLAB_AREA area, SLAB_MGR mgr,
  180. int level)
  181. {
  182. int slab_size = slab_levels[level] + SLAB_HDR_SIZE;
  183. mgr->addr[level] = (void *) area->raw;
  184. mgr->addr_top[level] = (void *) area->raw + area->size * slab_size;
  185. mgr->size[level] += area->size;
  186. }
  187. static inline SLAB_MGR create_slab_mgr (void)
  188. {
  189. #ifdef PAGE_SIZE
  190. int size = init_size_align_up(STARTUP_SIZE);
  191. #else
  192. int size = STARTUP_SIZE;
  193. #endif
  194. unsigned long mem;
  195. SLAB_AREA area;
  196. SLAB_MGR mgr;
  197. mem = (unsigned long) system_malloc(__INIT_MAX_MEM_SIZE(size));
  198. if (mem <= 0)
  199. return NULL;
  200. mgr = (SLAB_MGR) mem;
  201. void * addr = (void *) mgr + sizeof(SLAB_MGR_TYPE);
  202. int i;
  203. for (i = 0 ; i < SLAB_LEVEL ; i++) {
  204. area = (SLAB_AREA) addr;
  205. area->size = STARTUP_SIZE;
  206. INIT_LIST_HEAD(&area->__list);
  207. INIT_LIST_HEAD(&mgr->area_list[i]);
  208. list_add_tail(&area->__list, &mgr->area_list[i]);
  209. INIT_LIST_HEAD(&mgr->free_list[i]);
  210. mgr->size[i] = 0;
  211. __set_free_slab_area(area, mgr, i);
  212. addr += __MAX_MEM_SIZE(slab_levels[i], STARTUP_SIZE);
  213. }
  214. return mgr;
  215. }
  216. static inline void destroy_slab_mgr (SLAB_MGR mgr)
  217. {
  218. void * addr = (void *) mgr + sizeof(SLAB_MGR_TYPE);
  219. SLAB_AREA area, tmp, n;
  220. int i;
  221. for (i = 0 ; i < SLAB_LEVEL; i++) {
  222. area = (SLAB_AREA) addr;
  223. list_for_each_entry_safe(tmp, n, &mgr->area_list[i], __list) {
  224. if (tmp != area)
  225. system_free(area,
  226. __MAX_MEM_SIZE(slab_levels[i], area->size));
  227. }
  228. addr += __MAX_MEM_SIZE(slab_levels[i], STARTUP_SIZE);
  229. }
  230. system_free(mgr, addr - (void *) mgr);
  231. }
  232. static inline SLAB_MGR enlarge_slab_mgr (SLAB_MGR mgr, int level)
  233. {
  234. SLAB_AREA area;
  235. int size;
  236. if (level >= SLAB_LEVEL) {
  237. system_lock();
  238. goto out;
  239. }
  240. size = mgr->size[level];
  241. area = (SLAB_AREA) system_malloc(__MAX_MEM_SIZE(slab_levels[level], size));
  242. if (area <= 0)
  243. return NULL;
  244. system_lock();
  245. area->size = size;
  246. INIT_LIST_HEAD(&area->__list);
  247. list_add(&area->__list, &mgr->area_list[level]);
  248. __set_free_slab_area(area, mgr, level);
  249. system_unlock();
  250. out:
  251. return mgr;
  252. }
  253. static inline void * slab_alloc (SLAB_MGR mgr, int size)
  254. {
  255. SLAB_OBJ mobj;
  256. int i;
  257. int level = -1;
  258. for (i = 0 ; i < SLAB_LEVEL ; i++)
  259. if (size <= slab_levels[i]) {
  260. level = i;
  261. break;
  262. }
  263. if (level == -1) {
  264. LARGE_MEM_OBJ mem = (LARGE_MEM_OBJ)
  265. system_malloc(sizeof(LARGE_MEM_OBJ_TYPE) + size);
  266. if (!mem)
  267. return NULL;
  268. mem->size = size;
  269. OBJ_LEVEL(mem) = (unsigned char) -1;
  270. return OBJ_RAW(mem);
  271. }
  272. system_lock();
  273. if (mgr->addr[level] == mgr->addr_top[level] &&
  274. list_empty(&mgr->free_list[level])) {
  275. system_unlock();
  276. enlarge_slab_mgr(mgr, level);
  277. system_lock();
  278. }
  279. if (!list_empty(&mgr->free_list[level])) {
  280. mobj = list_first_entry(&mgr->free_list[level], SLAB_OBJ_TYPE, __list);
  281. list_del(&mobj->__list);
  282. } else {
  283. mobj = (void *) mgr->addr[level];
  284. mgr->addr[level] += slab_levels[level] + SLAB_HDR_SIZE;
  285. }
  286. OBJ_LEVEL(mobj) = level;
  287. system_unlock();
  288. #ifdef SLAB_CANARY
  289. unsigned long * m =
  290. (unsigned long *) ((void *) OBJ_RAW(mobj) + slab_levels[level]);
  291. *m = SLAB_CANARY_STRING;
  292. #endif
  293. return OBJ_RAW(mobj);
  294. }
  295. #ifdef SLAB_DEBUG
  296. static inline void * slab_alloc_debug (SLAB_MGR mgr, int size,
  297. const char * file, int line)
  298. {
  299. void * mem = slab_alloc(mgr, size);
  300. int i;
  301. int level = -1;
  302. for (i = 0 ; i < SLAB_LEVEL ; i++)
  303. if (size <= slab_levels[i]) {
  304. level = i;
  305. break;
  306. }
  307. if (level != -1) {
  308. struct slab_debug * debug =
  309. (struct slab_debug *) (mem + slab_levels[level] +
  310. SLAB_CANARY_SIZE);
  311. debug->alloc.file = file;
  312. debug->alloc.line = line;
  313. }
  314. return mem;
  315. }
  316. #endif
  317. static inline void slab_free (SLAB_MGR mgr, void * obj)
  318. {
  319. /* In a general purpose allocator, free of NULL is allowed (and is a
  320. * nop). We might want to enforce stricter rules for our allocator if
  321. * we're sure that no clients rely on being able to free NULL. */
  322. if (obj == NULL)
  323. return;
  324. unsigned char level = RAW_TO_LEVEL(obj);
  325. if (level == (unsigned char) -1) {
  326. LARGE_MEM_OBJ mem = RAW_TO_OBJ(obj, LARGE_MEM_OBJ_TYPE);
  327. system_free(mem, mem->size + sizeof(LARGE_MEM_OBJ_TYPE));
  328. return;
  329. }
  330. /* If this happens, either the heap is already corrupted, or someone's
  331. * freeing something that's wrong, which will most likely lead to heap
  332. * corruption. Either way, panic if this happens. TODO: this doesn't allow
  333. * us to detect cases where the heap headers have been zeroed, which
  334. * is a common type of heap corruption. We could make this case slightly
  335. * more likely to be detected by adding a non-zero offset to the level,
  336. * so a level of 0 in the header would no longer be a valid level. */
  337. if (level >= SLAB_LEVEL) {
  338. pal_printf("Heap corruption detected: invalid heap level %ud\n", level);
  339. assert(0); // panic
  340. }
  341. #ifdef SLAB_CANARY
  342. unsigned long * m = (unsigned long *) (obj + slab_levels[level]);
  343. assert((*m) == SLAB_CANARY_STRING);
  344. #endif
  345. SLAB_OBJ mobj = RAW_TO_OBJ(obj, SLAB_OBJ_TYPE);
  346. system_lock();
  347. INIT_LIST_HEAD(&mobj->__list);
  348. list_add_tail(&mobj->__list, &mgr->free_list[level]);
  349. system_unlock();
  350. }
  351. #ifdef SLAB_DEBUG
  352. static inline void slab_free_debug (SLAB_MGR mgr, void * obj,
  353. const char * file, int line)
  354. {
  355. if (obj == NULL)
  356. return;
  357. unsigned char level = RAW_TO_LEVEL(obj);
  358. if (level < SLAB_LEVEL) {
  359. struct slab_debug * debug =
  360. (struct slab_debug *) (obj + slab_levels[level] +
  361. SLAB_CANARY_SIZE);
  362. debug->free.file = file;
  363. debug->free.line = line;
  364. }
  365. slab_free(mgr, obj);
  366. }
  367. #endif
  368. #endif /* SLABMGR_H */