/*-
 * Copyright (c) 2005-2006, Kohsuke Ohtani
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the author nor the names of any co-contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

/*
 * kmem.c - kernel memory allocator
 */

/*
 * This is a memory allocator optimized for a kernel with a small
 * footprint. It works on top of the underlying page allocator and
 * manages memory in units smaller than the page size. It divides a
 * page into two or more blocks, and each such page is linked in as
 * a kernel page.
 *
 * The following three linked lists manage the used/free blocks:
 *  1) All pages allocated for kernel memory are linked.
 *  2) All blocks placed in the same page are linked.
 *  3) All free blocks of the same size are linked.
 *
 * Currently, the allocator cannot handle requests that exceed one
 * page. A driver can use page_alloc() instead to allocate larger
 * memory. A sketch of the resulting page layout follows below.
 *
 * The kmem functions are used not only by the kernel core but also
 * by buggy drivers. If such kernel code writes data beyond the end
 * of its allocated area, the system can easily crash. To help
 * detect such memory overruns, each memory block has a magic ID.
 */
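
/*
 * A rough sketch of the on-page layout (illustrative only; exact
 * offsets depend on the architecture). Note that the header of the
 * first block is embedded in the page header itself:
 *
 *      page top
 *      +----------------------------------------+
 *      | page_hdr { magic, nallocs, first_blk } |
 *      +----------------------------------------+
 *      | user data of the first block           |
 *      +----------------------------------------+
 *      | block_hdr of the second block          | <- first_blk.pg_next
 *      +----------------------------------------+
 *      | user data of the second block          |
 *      |   ...                                  |
 */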

#include <kernel.h>
#include <page.h>
#include <sched.h>
#include <vm.h>

/*
 * Block header
 *
 * All free blocks of the same size are linked to one another via
 * "link". In addition, all blocks within the same page are chained
 * together via "pg_next".
 */
struct block_hdr {
        u_short magic;                  /* magic number */
        u_short size;                   /* size of this block */
        struct list link;               /* link to the free list */
        struct block_hdr *pg_next;      /* next block in same page */
};

/*
 * Page header
 *
 * The page header is placed at the top of each page. It is used to
 * free the page once no allocated blocks are left in it: when the
 * nallocs count drops to zero, the page can be removed from the
 * kernel pages.
 */
struct page_hdr {
        u_short magic;                  /* magic number */
        u_short nallocs;                /* number of allocated blocks */
        struct block_hdr first_blk;     /* first block in this page */
};

#define ALIGN_SIZE      16
#define ALIGN_MASK      (ALIGN_SIZE - 1)
#define ALLOC_ALIGN(n)  (((n) + ALIGN_MASK) & ~ALIGN_MASK)

#define BLOCK_MAGIC     0xdead
#define PAGE_MAGIC      0xbeef

#define BLKHDR_SIZE     (sizeof(struct block_hdr))
#define PGHDR_SIZE      (sizeof(struct page_hdr))
#define MAX_ALLOC_SIZE  (PAGE_SIZE - PGHDR_SIZE)

#define MIN_BLOCK_SIZE  (BLKHDR_SIZE + 16)
#define MAX_BLOCK_SIZE  (u_short)(PAGE_SIZE - (PGHDR_SIZE - BLKHDR_SIZE))

/* macro to get the page header from a specific address */
#define PAGE_TOP(n)     (struct page_hdr *) \
                            ((u_long)(n) & ~(PAGE_SIZE - 1))

/* index into the free block lists */
#define BLKIDX(b)       ((int)((b)->size) >> 4)

/* number of free block lists */
#define NR_BLOCK_LIST   (PAGE_SIZE / ALIGN_SIZE)
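
/*
 * A worked example of the size arithmetic above, assuming PAGE_SIZE
 * is 4096 and a 32-bit target where struct list holds two pointers.
 * These sizes are assumptions for illustration, not normative:
 *
 *      BLKHDR_SIZE    = 2 + 2 + 8 + 4       = 16 bytes
 *      PGHDR_SIZE     = 2 + 2 + BLKHDR_SIZE = 20 bytes
 *      MAX_ALLOC_SIZE = 4096 - 20           = 4076 bytes
 *      MIN_BLOCK_SIZE = 16 + 16             = 32 bytes
 *      MAX_BLOCK_SIZE = 4096 - (20 - 16)    = 4092 bytes
 *      NR_BLOCK_LIST  = 4096 / 16           = 256 lists
 */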

/**
 * Array of the heads of the free block lists.
 *
 * The array index is derived from the size of each block; every
 * block has a size that is a multiple of 16.
 *
 * ie. free_blocks[0] = list for 16 byte blocks
 *     free_blocks[1] = list for 32 byte blocks
 *     free_blocks[2] = list for 48 byte blocks
 *     .
 *     .
 *     free_blocks[255] = list for 4096 byte blocks
 *
 * Generally, a single list is used to search for a free block with
 * a first-fit algorithm. This allocator is also first fit, but it
 * keeps multiple lists, one per block size. A search starts from
 * the list of the requested size, so the lists of smaller blocks
 * never have to be searched wastefully.
 *
 * Most kernel memory allocators use power-of-two block sizes, but
 * such implementations throw away a lot of memory whenever the
 * block size does not fit the request. That is not suitable for an
 * embedded system with a small footprint.
 */
static struct list free_blocks[NR_BLOCK_LIST];
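
/*
 * For example (an illustrative sketch, with the 16-byte BLKHDR_SIZE
 * assumed above): a kmem_alloc(100) request is rounded up to
 * ALLOC_ALIGN(100 + 16) = 128 bytes, so the search starts at
 * free_blocks[128 >> 4] = free_blocks[8]. A freed 48-byte block
 * goes back on free_blocks[48 >> 4] = free_blocks[3].
 */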

static int kmem_bytes;          /* number of bytes currently allocated */

#ifdef DEBUG
/*
 * profiling data
 */
static int nr_pages;                    /* number of pages currently used */
static int nr_blocks[NR_BLOCK_LIST];    /* number of blocks currently used */
#endif  /* DEBUG */

/*
 * Find a free block for the specified size.
 * Returns a pointer to the free block, or NULL on failure.
 *
 * The list for the requested size is searched first. If it is
 * empty, the lists of larger sizes are searched in turn, so the
 * smallest block that satisfies the request is used.
 */
static struct block_hdr *
block_find(size_t size)
{
        int i;
        list_t n;

        for (i = (int)size >> 4; i < NR_BLOCK_LIST; i++) {
                if (!list_empty(&free_blocks[i]))
                        break;
        }
        if (i >= NR_BLOCK_LIST)
                return NULL;

        n = list_first(&free_blocks[i]);
        return list_entry(n, struct block_hdr, link);
}
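
/*
 * For instance (hypothetical numbers, for illustration): for a
 * 128-byte request the scan starts at free_blocks[8]. If lists 8
 * through 12 are empty but free_blocks[13] holds a 208-byte block,
 * that block is returned here and later split by kmem_alloc().
 */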

/*
 * Allocate a memory block for the kernel.
 *
 * For performance, this function does not fill the allocated block
 * with zeroes. kmem_alloc() returns NULL on failure.
 */
void *
kmem_alloc(size_t size)
{
        struct block_hdr *blk, *new_blk;
        struct page_hdr *pg;
        void *p;

        ASSERT(irq_level == 0);

        sched_lock();           /* Lock scheduler */
        /*
         * First, search the pages already in use for a free block
         * of sufficient size. If none exists, allocate a new page.
         */
        size = ALLOC_ALIGN(size + BLKHDR_SIZE);

        ASSERT(size && size <= MAX_ALLOC_SIZE);

        blk = block_find(size);
        if (blk) {
                /* Block found */
                list_remove(&blk->link);        /* Remove from free list */
                pg = PAGE_TOP(blk);             /* Get the page address */
        } else {
                /* No block found. Allocate a new page */
                if ((pg = page_alloc(PAGE_SIZE)) == NULL) {
                        sched_unlock();
                        return NULL;
                }
                pg = phys_to_virt(pg);
                pg->nallocs = 0;
                pg->magic = PAGE_MAGIC;

                /* Set up the first block */
                blk = &(pg->first_blk);
                blk->magic = BLOCK_MAGIC;
                blk->size = MAX_BLOCK_SIZE;
                blk->pg_next = NULL;
#ifdef DEBUG
                nr_pages++;
#endif
        }
        /* Sanity check */
        if (pg->magic != PAGE_MAGIC || blk->magic != BLOCK_MAGIC)
                panic("kmem overrun: addr=%x", blk);
        /*
         * If the found block is large enough, split it.
         */
        if (blk->size - size >= MIN_BLOCK_SIZE) {
                /* Make a new block */
                new_blk = (struct block_hdr *)((u_long)blk + size);
                new_blk->magic = BLOCK_MAGIC;
                new_blk->size = (u_short)(blk->size - size);
                list_insert(&free_blocks[BLKIDX(new_blk)], &new_blk->link);

                /* Update the page list */
                new_blk->pg_next = blk->pg_next;
                blk->pg_next = new_blk;

                blk->size = (u_short)size;
        }
        /* Increment the allocation count of this page */
        pg->nallocs++;
        kmem_bytes += blk->size;
#ifdef DEBUG
        nr_blocks[BLKIDX(blk)]++;
#endif
        p = (void *)((u_long)blk + BLKHDR_SIZE);
        sched_unlock();
        return p;
}
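
/*
 * A typical call sequence (a hedged sketch, not taken from the
 * original source; "struct foo" and a libkern-style memset() are
 * assumed for illustration):
 *
 *      struct foo *fp;
 *
 *      fp = kmem_alloc(sizeof(*fp));
 *      if (fp == NULL)
 *              return ENOMEM;          // allocation can fail
 *      memset(fp, 0, sizeof(*fp));     // kmem_alloc() does not zero
 *      ...
 *      kmem_free(fp);
 */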

/*
 * Free an allocated memory block.
 *
 * Some kernels never release pages that were used for kernel
 * memory, on the assumption that they will be needed again soon.
 * For example, it would be efficient here to simply keep a freed
 * page linked on the list of the largest block size. However,
 * consider the case where a driver temporarily requires many small
 * blocks: if such pages were never released after being freed,
 * they could not be reused for an application. So this allocator
 * returns an empty page to the page allocator instead.
 */
void
kmem_free(void *ptr)
{
        struct block_hdr *blk;
        struct page_hdr *pg;

        ASSERT(irq_level == 0);
        ASSERT(ptr);

        /* Lock scheduler */
        sched_lock();

        /* Get the block header */
        blk = (struct block_hdr *)((u_long)ptr - BLKHDR_SIZE);
        if (blk->magic != BLOCK_MAGIC)
                panic("kmem_free");

        kmem_bytes -= blk->size;

#ifdef DEBUG
        nr_blocks[BLKIDX(blk)]--;
#endif
        /*
         * Return the block to the free list. Since kernel code
         * tends to request fixed-size blocks, the blocks are kept
         * as a cache rather than merged with their neighbors.
         */
        list_insert(&free_blocks[BLKIDX(blk)], &blk->link);

        /* Decrement the allocation count of this page */
        pg = PAGE_TOP(blk);
        if (--pg->nallocs <= 0) {
                /*
                 * No allocated blocks are left in this page.
                 * Remove all blocks and deallocate the page.
                 */
                for (blk = &(pg->first_blk); blk != NULL; blk = blk->pg_next) {
                        list_remove(&blk->link);  /* Remove from free list */
#ifdef DEBUG
                        nr_blocks[BLKIDX(blk)]--;
#endif
                }
                pg->magic = 0;
                page_free(virt_to_phys(pg), PAGE_SIZE);
#ifdef DEBUG
                nr_pages--;
#endif
        }
        sched_unlock();
}
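
/*
 * The magic words catch the overruns mentioned in the file header.
 * An illustrative (hypothetical) sequence, using the 16-byte
 * BLKHDR_SIZE assumed earlier:
 *
 *      char *p = kmem_alloc(32);  // carved from a 48-byte block
 *      p[32] = 0;                 // scribbles over the following
 *                                 // block's header and its magic
 *
 * The corruption is detected the next time the neighboring block is
 * handed out by kmem_alloc() (the "kmem overrun" panic) or released
 * via kmem_free() (the "kmem_free" panic).
 */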

/*
 * Map the specified virtual address to a kernel address.
 * Returns the kernel address on success, or NULL if the memory is
 * not mapped.
 */
void *
kmem_map(void *addr, size_t size)
{
        void *phys;

        phys = vm_translate(addr, size);
        if (phys == NULL)
                return NULL;
        return phys_to_virt(phys);
}
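
/*
 * For example (a hedged sketch; the driver context, error code,
 * and memcpy() are assumed for illustration), a driver can
 * validate and map a user buffer before touching it:
 *
 *      void *kaddr = kmem_map(uaddr, len);
 *      if (kaddr == NULL)
 *              return EFAULT;  // not mapped in the caller's space
 *      memcpy(kaddr, data, len);
 */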

void
kmem_info(size_t *size)
{

        *size = (size_t)kmem_bytes;
}

#if defined(DEBUG) && defined(CONFIG_KDUMP)
void
kmem_dump(void)
{
        list_t head, n;
        int i, cnt;

        printk("\nKernel memory dump:\n");

        printk(" allocated blocks:\n");
        printk(" block size count\n");
        printk(" ---------- --------\n");

        for (i = 0; i < NR_BLOCK_LIST; i++) {
                if (nr_blocks[i])
                        printk(" %4d %8d\n", i << 4, nr_blocks[i]);
        }
        printk("\n free blocks:\n");
        printk(" block size count\n");
        printk(" ---------- --------\n");

        for (i = 0; i < NR_BLOCK_LIST; i++) {
                cnt = 0;
                head = &free_blocks[i];
                for (n = list_first(head); n != head; n = list_next(n))
                        cnt++;
                if (cnt > 0)
                        printk(" %4d %8d\n", i << 4, cnt);
        }
        printk(" Total: page=%d (%dKbyte) alloc=%dbyte unused=%dbyte\n",
               nr_pages, (nr_pages * PAGE_SIZE) / 1024, kmem_bytes,
               nr_pages * PAGE_SIZE - kmem_bytes);
}
#endif

void
kmem_init(void)
{
        int i;

        for (i = 0; i < NR_BLOCK_LIST; i++)
                list_init(&free_blocks[i]);
}