/*-
 * Copyright (c) 2005-2006, Kohsuke Ohtani
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the author nor the names of any co-contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

/*
 * kmem.c - kernel memory allocator
 */

/*
 * This is a memory allocator optimized for a low-footprint kernel.
 * It works on top of the underlying page allocator and manages
 * allocations smaller than the page size by dividing a page into
 * two or more blocks; each such page is linked as a kernel page.
 *
 * The following three linked lists are used to manage used and
 * free blocks:
 *  1) All pages allocated for kernel memory are linked.
 *  2) All blocks carved out of the same page are linked.
 *  3) All free blocks of the same size are linked.
 *
 * The allocator cannot currently handle requests larger than one
 * page. A driver can use page_alloc() instead to allocate larger
 * memory.
 *
 * The kmem functions are used not only by the kernel core but also
 * by potentially buggy drivers. If such kernel code writes past the
 * end of its allocated area, the system can easily crash. To help
 * detect such overruns, each block carries a magic ID.
 */
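
/*
 * Typical use from kernel code (an illustrative sketch only; the
 * structure name and error handling are hypothetical, not taken from
 * an actual caller):
 *
 *      struct foo *fp;
 *
 *      fp = kmem_alloc(sizeof(struct foo));
 *      if (fp == NULL)
 *              ... out of kernel memory; fail the request ...
 *      ...
 *      kmem_free(fp);
 */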

#include <kernel.h>
#include <page.h>
#include <sched.h>
#include <vm.h>
#include <kmem.h>

/*
 * Block header
 *
 * All free blocks of the same size are linked together on one free
 * list. In addition, all blocks carved out of the same page, used or
 * free, are chained together via pg_next.
 */
struct block_hdr {
        u_short magic;                  /* magic number */
        u_short size;                   /* size of this block */
        struct list link;               /* link to the free list */
        struct block_hdr *pg_next;      /* next block in the same page */
};

/*
 * Page header
 *
 * The page header is placed at the top of each page. It is used to
 * free the page when no allocated block is left in it: once nallocs
 * drops to zero, the page can be returned to the page allocator.
 */
struct page_hdr {
        u_short magic;                  /* magic number */
        u_short nallocs;                /* number of allocated blocks */
        struct block_hdr first_blk;     /* first block in this page */
};
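
/*
 * Every block in a page, allocated or free, can be reached from the
 * page header through the pg_next chain. A minimal sketch of walking
 * that chain (it mirrors the loop in kmem_free(); "pg" is assumed to
 * point to a valid page header):
 *
 *      struct block_hdr *b;
 *
 *      for (b = &pg->first_blk; b != NULL; b = b->pg_next)
 *              ... every block in the page is visited here ...
 */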

#define ALIGN_SIZE      16
#define ALIGN_MASK      (ALIGN_SIZE - 1)
#define ALLOC_ALIGN(n)  (((vaddr_t)(n) + ALIGN_MASK) & (vaddr_t)~ALIGN_MASK)

#define BLOCK_MAGIC     0xdead
#define PAGE_MAGIC      0xbeef

#define BLKHDR_SIZE     (sizeof(struct block_hdr))
#define PGHDR_SIZE      (sizeof(struct page_hdr))
#define MAX_ALLOC_SIZE  (size_t)(PAGE_SIZE - PGHDR_SIZE)

#define MIN_BLOCK_SIZE  (BLKHDR_SIZE + 16)
#define MAX_BLOCK_SIZE  (u_short)(PAGE_SIZE - (PGHDR_SIZE - BLKHDR_SIZE))

/* macro to get the page header from a specific address */
#define PAGE_TOP(n)     (struct page_hdr *) \
                            ((vaddr_t)(n) & (vaddr_t)~(PAGE_SIZE - 1))

/* index into the free block lists */
#define BLKIDX(b)       ((u_int)((b)->size) >> 4)

/* number of free block lists */
#define NR_BLOCK_LIST   (PAGE_SIZE / ALIGN_SIZE)
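
/*
 * Example of the size arithmetic above (the request size is purely
 * illustrative, and BLKHDR_SIZE is assumed to be 16 bytes here, as on
 * a typical 32-bit configuration):
 *
 *      kmem_alloc(20)
 *        -> size = ALLOC_ALIGN(20 + BLKHDR_SIZE) = ALLOC_ALIGN(36) = 48
 *        -> block_find() starts at free_blocks[48 >> 4] = free_blocks[3]
 *           and falls back to the lists of larger sizes if that one
 *           is empty.
 */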

/**
 * Array of heads of the free block lists.
 *
 * The array index is derived from the block size: free_blocks[i]
 * holds the free blocks whose size (including the block header) is
 * in the range [16 * i, 16 * i + 15]. Allocation sizes are always
 * rounded up to a multiple of 16.
 *
 * e.g. free_blocks[1]   = list of 16 byte blocks
 *      free_blocks[2]   = list of 32 byte blocks
 *      free_blocks[3]   = list of 48 byte blocks
 *       .
 *       .
 *      free_blocks[255] = list of the largest blocks (up to
 *                         MAX_BLOCK_SIZE)
 *
 * A conventional first-fit allocator searches a single free list.
 * This allocator also uses first fit, but it keeps one list per
 * block size and starts the search at the list for the requested
 * size, so it never wastes time scanning lists of blocks that are
 * too small.
 *
 * Many kernel memory allocators round block sizes up to powers of
 * two, but that wastes a lot of memory whenever the requested size
 * is not a good fit, which is unsuitable for a low-footprint
 * embedded system.
 */
static struct list free_blocks[NR_BLOCK_LIST];

/*
 * Find a free block for the specified size.
 * Returns a pointer to the free block, or NULL on failure.
 *
 * The search starts at the list for the requested size; if that list
 * is empty, the lists for larger sizes are tried in order, so the
 * block comes from the smallest size class that can satisfy the
 * request.
 */
static struct block_hdr *
block_find(size_t size)
{
        int i;
        list_t n;

        for (i = (int)((u_int)size >> 4); i < NR_BLOCK_LIST; i++) {
                if (!list_empty(&free_blocks[i]))
                        break;
        }
        if (i >= NR_BLOCK_LIST)
                return NULL;

        n = list_first(&free_blocks[i]);
        return list_entry(n, struct block_hdr, link);
}
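
/*
 * For example (the sizes are illustrative): if the aligned request is
 * 48 bytes and free_blocks[3] through free_blocks[5] are empty while
 * free_blocks[6] holds a 96-byte block, block_find(48) returns that
 * 96-byte block, and kmem_alloc() later splits off the unused tail.
 */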

/*
 * Allocate a memory block for the kernel.
 *
 * For performance, this function does not zero the allocated block.
 * kmem_alloc() returns NULL on failure.
 */
void *
kmem_alloc(size_t size)
{
        struct block_hdr *blk, *newblk;
        struct page_hdr *pg;
        void *p;

        ASSERT(irq_level == 0);

        sched_lock();           /* Lock scheduler */
        /*
         * First, search the pages already in use for a free block of
         * sufficient size. If none exists, allocate a new page.
         */
        size = ALLOC_ALIGN(size + BLKHDR_SIZE);

        ASSERT(size && size <= MAX_ALLOC_SIZE);

        blk = block_find(size);
        if (blk) {
                /* Block found */
                list_remove(&blk->link);        /* Remove from free list */
                pg = PAGE_TOP(blk);             /* Get the page address */
        } else {
                /* No block found. Allocate new page */
                if ((pg = page_alloc(PAGE_SIZE)) == NULL) {
                        sched_unlock();
                        return NULL;
                }
                pg = phys_to_virt(pg);
                pg->nallocs = 0;
                pg->magic = PAGE_MAGIC;

                /* Setup first block */
                blk = &(pg->first_blk);
                blk->magic = BLOCK_MAGIC;
                blk->size = MAX_BLOCK_SIZE;
                blk->pg_next = NULL;
        }
        /* Sanity check */
        if (pg->magic != PAGE_MAGIC || blk->magic != BLOCK_MAGIC)
                panic("kmem_alloc: overrun");
        /*
         * If the found block is large enough, split it.
         */
        if (blk->size - size >= MIN_BLOCK_SIZE) {
                /* Make new block */
                newblk = (struct block_hdr *)((char *)blk + size);
                newblk->magic = BLOCK_MAGIC;
                newblk->size = (u_short)(blk->size - size);
                list_insert(&free_blocks[BLKIDX(newblk)], &newblk->link);

                /* Update page list */
                newblk->pg_next = blk->pg_next;
                blk->pg_next = newblk;

                blk->size = (u_short)size;
        }
        /* Increment allocation count of this page */
        pg->nallocs++;
        p = (char *)blk + BLKHDR_SIZE;
        sched_unlock();
        return p;
}
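
/*
 * Worked example of the split above (the numbers are illustrative and
 * assume a 16-byte block header): a request for 100 bytes becomes
 * size = ALLOC_ALIGN(100 + 16) = 128. If block_find() returns a free
 * block of 512 bytes, the remainder 512 - 128 = 384 >= MIN_BLOCK_SIZE,
 * so the tail becomes a new free block on free_blocks[384 >> 4] =
 * free_blocks[24], and the caller gets 128 - BLKHDR_SIZE = 112 usable
 * bytes starting at blk + BLKHDR_SIZE.
 */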

/*
 * Free an allocated memory block.
 *
 * Some kernels never return completely free pages to the page
 * allocator, on the assumption that they will be needed again soon;
 * here, for example, it would be cheap to simply keep an empty page
 * on the largest-size free list. However, consider a driver that
 * temporarily allocates many small blocks: if its pages were kept
 * after those blocks are freed, they could never be reused by an
 * application. This allocator therefore releases a page as soon as
 * it holds no allocated blocks.
 */
void
kmem_free(void *ptr)
{
        struct block_hdr *blk;
        struct page_hdr *pg;

        ASSERT(irq_level == 0);
        ASSERT(ptr);

        /* Lock scheduler */
        sched_lock();

        /* Get the block header */
        blk = (struct block_hdr *)((char *)ptr - BLKHDR_SIZE);
        if (blk->magic != BLOCK_MAGIC)
                panic("kmem_free: invalid address");

        /*
         * Return the block to the free list. Since kernel code tends
         * to request the same fixed block sizes repeatedly, blocks are
         * not merged with their neighbors; keeping them at their
         * current size lets the free lists act as a cache for later
         * requests.
         */
        list_insert(&free_blocks[BLKIDX(blk)], &blk->link);

        /* Decrement allocation count of this page */
        pg = PAGE_TOP(blk);
        if (--pg->nallocs <= 0) {
                /*
                 * No allocated block is left in this page.
                 * Remove all of its blocks from the free lists and
                 * release the page.
                 */
                for (blk = &(pg->first_blk); blk != NULL; blk = blk->pg_next) {
                        list_remove(&blk->link);        /* Remove from free list */
                }
                pg->magic = 0;
                page_free(virt_to_phys(pg), PAGE_SIZE);
        }
        sched_unlock();
}

/*
 * Map the specified virtual address to a kernel address.
 * Returns the kernel address on success, or NULL if the memory is
 * not mapped.
 */
void *
kmem_map(void *addr, size_t size)
{
        void *phys;

        phys = vm_translate(addr, size);
        if (phys == NULL)
                return NULL;
        return phys_to_virt(phys);
}
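
/*
 * Illustrative use of kmem_map() (the variable names and the error
 * path are hypothetical, not taken from an actual driver): a driver
 * handed a buffer address in another task's address space can obtain
 * a kernel-accessible alias before touching it:
 *
 *      void *kaddr;
 *
 *      if ((kaddr = kmem_map(uaddr, len)) == NULL)
 *              ... the address is not mapped; fail the request ...
 *      memcpy(kaddr, data, len);
 */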

/*
 * Initialize the kernel memory allocator: all free block lists start
 * out empty.
 */
void
kmem_init(void)
{
        int i;

        for (i = 0; i < NR_BLOCK_LIST; i++)
                list_init(&free_blocks[i]);
}