Annotation of XNU/bsd/ufs/ffs/ffs_alloc.c, revision 1.1.1.1

1.1       root        1: /*
                      2:  * Copyright (c) 2000 Apple Computer, Inc. All rights reserved.
                      3:  *
                      4:  * @APPLE_LICENSE_HEADER_START@
                      5:  * 
                      6:  * The contents of this file constitute Original Code as defined in and
                      7:  * are subject to the Apple Public Source License Version 1.1 (the
                      8:  * "License").  You may not use this file except in compliance with the
                      9:  * License.  Please obtain a copy of the License at
                     10:  * http://www.apple.com/publicsource and read it before using this file.
                     11:  * 
                     12:  * This Original Code and all software distributed under the License are
                     13:  * distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, EITHER
                     14:  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
                     15:  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
                     16:  * FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT.  Please see the
                     17:  * License for the specific language governing rights and limitations
                     18:  * under the License.
                     19:  * 
                     20:  * @APPLE_LICENSE_HEADER_END@
                     21:  */
                     22: /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
                     23: /*
                     24:  * Copyright (c) 1982, 1986, 1989, 1993
                     25:  *     The Regents of the University of California.  All rights reserved.
                     26:  *
                     27:  * Redistribution and use in source and binary forms, with or without
                     28:  * modification, are permitted provided that the following conditions
                     29:  * are met:
                     30:  * 1. Redistributions of source code must retain the above copyright
                     31:  *    notice, this list of conditions and the following disclaimer.
                     32:  * 2. Redistributions in binary form must reproduce the above copyright
                     33:  *    notice, this list of conditions and the following disclaimer in the
                     34:  *    documentation and/or other materials provided with the distribution.
                     35:  * 3. All advertising materials mentioning features or use of this software
                     36:  *    must display the following acknowledgement:
                     37:  *     This product includes software developed by the University of
                     38:  *     California, Berkeley and its contributors.
                     39:  * 4. Neither the name of the University nor the names of its contributors
                     40:  *    may be used to endorse or promote products derived from this software
                     41:  *    without specific prior written permission.
                     42:  *
                     43:  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
                     44:  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
                     45:  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
                     46:  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
                     47:  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
                     48:  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
                     49:  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
                     50:  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
                     51:  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
                     52:  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
                     53:  * SUCH DAMAGE.
                     54:  *
                     55:  *     @(#)ffs_alloc.c 8.18 (Berkeley) 5/26/95
                     56:  */
                     57: #include <rev_endian_fs.h>
                     58: #include <vm/vm_pager.h>
                     59: #include <vm/vnode_pager.h>
                     60: 
                     61: #include <sys/param.h>
                     62: #include <sys/systm.h>
                     63: #include <sys/buf.h>
                     64: #include <sys/proc.h>
                     65: #include <sys/vnode.h>
                     66: #include <sys/mount.h>
                     67: #include <sys/kernel.h>
                     68: #include <sys/syslog.h>
                     69: 
                     70: #include <sys/vm.h>
                     71: 
                     72: #include <ufs/ufs/quota.h>
                     73: #include <ufs/ufs/inode.h>
                     74: 
                     75: #include <ufs/ffs/fs.h>
                     76: #include <ufs/ffs/ffs_extern.h>
                     77: 
                     78: #if REV_ENDIAN_FS
                     79: #include <ufs/ufs/ufs_byte_order.h>
                     80: #include <architecture/byte_order.h>
                     81: #endif /* REV_ENDIAN_FS */
                     82: 
                     83: extern u_long nextgennumber;
                     84: 
                     85: static ufs_daddr_t ffs_alloccg __P((struct inode *, int, ufs_daddr_t, int));
                     86: static ufs_daddr_t ffs_alloccgblk __P((struct fs *, struct cg *, ufs_daddr_t));
                     87: static ufs_daddr_t ffs_clusteralloc __P((struct inode *, int, ufs_daddr_t,
                     88:            int));
                     89: static ino_t   ffs_dirpref __P((struct fs *));
                     90: static ufs_daddr_t ffs_fragextend __P((struct inode *, int, long, int, int));
                     91: static void    ffs_fserr __P((struct fs *, u_int, char *));
                     92: static u_long  ffs_hashalloc
                     93:                    __P((struct inode *, int, long, int, u_int32_t (*)()));
                     94: static ino_t   ffs_nodealloccg __P((struct inode *, int, ufs_daddr_t, int));
                     95: static ufs_daddr_t ffs_mapsearch __P((struct fs *, struct cg *, ufs_daddr_t,
                     96:            int));
                     97: 
                     98: /*
                     99:  * Allocate a block in the file system.
                    100:  * 
                    101:  * The size of the requested block is given, which must be some
                    102:  * multiple of fs_fsize and <= fs_bsize.
                    103:  * A preference may be optionally specified. If a preference is given
                    104:  * the following hierarchy is used to allocate a block:
                    105:  *   1) allocate the requested block.
                    106:  *   2) allocate a rotationally optimal block in the same cylinder.
                    107:  *   3) allocate a block in the same cylinder group.
                    108:  *   4) quadradically rehash into other cylinder groups, until an
                    109:  *      available block is located.
                    110:  * If no block preference is given the following heirarchy is used
                    111:  * to allocate a block:
                    112:  *   1) allocate a block in the cylinder group that contains the
                    113:  *      inode for the file.
                    114:  *   2) quadradically rehash into other cylinder groups, until an
                    115:  *      available block is located.
                    116:  */
                    117: ffs_alloc(ip, lbn, bpref, size, cred, bnp)
                    118:        register struct inode *ip;
                    119:        ufs_daddr_t lbn, bpref;
                    120:        int size;
                    121:        struct ucred *cred;
                    122:        ufs_daddr_t *bnp;
                    123: {
                    124:        register struct fs *fs;
                    125:        ufs_daddr_t bno;
                    126:        int cg, error;
                    127: #if NeXT
                    128:        int devBlockSize=0;
                    129: #endif /* NeXT */
                    130:        *bnp = 0;
                    131:        fs = ip->i_fs;
                    132: #if DIAGNOSTIC
                    133:        if ((u_int)size > fs->fs_bsize || fragoff(fs, size) != 0) {
                    134:                printf("dev = 0x%x, bsize = %d, size = %d, fs = %s\n",
                    135:                    ip->i_dev, fs->fs_bsize, size, fs->fs_fsmnt);
                    136:                panic("ffs_alloc: bad size");
                    137:        }
                    138:        if (cred == NOCRED)
                    139:                panic("ffs_alloc: missing credential\n");
                    140: #endif /* DIAGNOSTIC */
                    141:        if (size == fs->fs_bsize && fs->fs_cstotal.cs_nbfree == 0)
                    142:                goto nospace;
                    143:        if (cred->cr_uid != 0 && freespace(fs, fs->fs_minfree) <= 0)
                    144:                goto nospace;
                    145: #ifdef NeXT
                    146:        VOP_DEVBLOCKSIZE(ip->i_devvp,&devBlockSize);
                    147: #endif /* NeXT */
                    148: #if QUOTA
                    149: #ifdef NeXT
                    150:         if (error = chkdq(ip, (long)btodb(size, devBlockSize), cred, 0))
                    151: #else
                    152:        if (error = chkdq(ip, (long)btodb(size), cred, 0))
                    153: #endif /* NeXT */
                    154:                return (error);
                    155: #endif /* QUOTA */
                    156:        if (bpref >= fs->fs_size)
                    157:                bpref = 0;
                    158:        if (bpref == 0)
                    159:                cg = ino_to_cg(fs, ip->i_number);
                    160:        else
                    161:                cg = dtog(fs, bpref);
                    162:        bno = (ufs_daddr_t)ffs_hashalloc(ip, cg, (long)bpref, size,
                    163:            (u_int32_t (*)())ffs_alloccg);
                    164:        if (bno > 0) {
                    165: #ifdef NeXT
                    166:                ip->i_blocks += btodb(size, devBlockSize);
                    167: #else
                    168:                ip->i_blocks += btodb(size);
                    169: #endif /* NeXT */
                    170:                ip->i_flag |= IN_CHANGE | IN_UPDATE;
                    171:                *bnp = bno;
                    172:                return (0);
                    173:        }
                    174: #if QUOTA
                    175:        /*
                    176:         * Restore user's disk quota because allocation failed.
                    177:         */
                    178: #ifdef NeXT
                    179:        (void) chkdq(ip, (long)-btodb(size, devBlockSize), cred, FORCE);
                    180: #else
                    181:        (void) chkdq(ip, (long)-btodb(size), cred, FORCE);
                    182: #endif /* NeXT */
                    183: #endif /* QUOTA */
                    184: nospace:
                    185:        ffs_fserr(fs, cred->cr_uid, "file system full");
                    186:        uprintf("\n%s: write failed, file system is full\n", fs->fs_fsmnt);
                    187:        return (ENOSPC);
                    188: }
                    189: 
                    190: /*
                    191:  * Reallocate a fragment to a bigger size
                    192:  *
                    193:  * The number and size of the old block is given, and a preference
                    194:  * and new size is also specified. The allocator attempts to extend
                    195:  * the original block. Failing that, the regular block allocator is
                    196:  * invoked to get an appropriate block.
                    197:  */
                    198: ffs_realloccg(ip, lbprev, bpref, osize, nsize, cred, bpp)
                    199:        register struct inode *ip;
                    200:        ufs_daddr_t lbprev;
                    201:        ufs_daddr_t bpref;
                    202:        int osize, nsize;
                    203:        struct ucred *cred;
                    204:        struct buf **bpp;
                    205: {
                    206:        register struct fs *fs;
                    207:        struct buf *bp;
                    208:        int cg, request, error;
                    209:        ufs_daddr_t bprev, bno;
                    210: #ifdef NeXT
                    211:        int devBlockSize=0;
                    212: #endif
                    213:        
                    214:        *bpp = 0;
                    215:        fs = ip->i_fs;
                    216: #if DIAGNOSTIC
                    217:        if ((u_int)osize > fs->fs_bsize || fragoff(fs, osize) != 0 ||
                    218:            (u_int)nsize > fs->fs_bsize || fragoff(fs, nsize) != 0) {
                    219:                printf(
                    220:                    "dev = 0x%x, bsize = %d, osize = %d, nsize = %d, fs = %s\n",
                    221:                    ip->i_dev, fs->fs_bsize, osize, nsize, fs->fs_fsmnt);
                    222:                panic("ffs_realloccg: bad size");
                    223:        }
                    224:        if (cred == NOCRED)
                    225:                panic("ffs_realloccg: missing credential\n");
                    226: #endif /* DIAGNOSTIC */
                    227:        if (cred->cr_uid != 0 && freespace(fs, fs->fs_minfree) <= 0)
                    228:                goto nospace;
                    229:        if ((bprev = ip->i_db[lbprev]) == 0) {
                    230:                printf("dev = 0x%x, bsize = %d, bprev = %d, fs = %s\n",
                    231:                    ip->i_dev, fs->fs_bsize, bprev, fs->fs_fsmnt);
                    232:                panic("ffs_realloccg: bad bprev");
                    233:        }
                    234:        /*
                    235:         * Allocate the extra space in the buffer.
                    236:         */
                    237:        if (error = bread(ITOV(ip), lbprev, osize, NOCRED, &bp)) {
                    238:                brelse(bp);
                    239:                return (error);
                    240:        }
                    241: #ifdef NeXT
                    242:        VOP_DEVBLOCKSIZE(ip->i_devvp,&devBlockSize);
                    243: #endif /* NeXT */
                    244: 
                    245: #if QUOTA
                    246: #ifdef NeXT
                    247:        if (error = chkdq(ip, (long)btodb(nsize - osize, devBlockSize), cred, 0))
                    248: #else
                    249:        if (error = chkdq(ip, (long)btodb(nsize - osize), cred, 0))
                    250: #endif /* NeXT */
                    251:        {
                    252:                brelse(bp);
                    253:                return (error);
                    254:        }
                    255: #endif /* QUOTA */
                    256:        /*
                    257:         * Check for extension in the existing location.
                    258:         */
                    259:        cg = dtog(fs, bprev);
                    260:        if (bno = ffs_fragextend(ip, cg, (long)bprev, osize, nsize)) {
                    261:                if (bp->b_blkno != fsbtodb(fs, bno))
                    262:                        panic("bad blockno");
                    263: #ifdef NeXT
                    264:                ip->i_blocks += btodb(nsize - osize, devBlockSize);
                    265: #else
                    266:                ip->i_blocks += btodb(nsize - osize);
                    267: #endif /* NeXT */
                    268:                ip->i_flag |= IN_CHANGE | IN_UPDATE;
                    269:                allocbuf(bp, nsize);
                    270:                bp->b_flags |= B_DONE;
                    271:                bzero((char *)bp->b_data + osize, (u_int)nsize - osize);
                    272:                *bpp = bp;
                    273:                return (0);
                    274:        }
                    275:        /*
                    276:         * Allocate a new disk location.
                    277:         */
                    278:        if (bpref >= fs->fs_size)
                    279:                bpref = 0;
                    280:        switch ((int)fs->fs_optim) {
                    281:        case FS_OPTSPACE:
                    282:                /*
                    283:                 * Allocate an exact sized fragment. Although this makes 
                    284:                 * best use of space, we will waste time relocating it if 
                    285:                 * the file continues to grow. If the fragmentation is
                    286:                 * less than half of the minimum free reserve, we choose
                    287:                 * to begin optimizing for time.
                    288:                 */
                    289:                request = nsize;
                    290:                if (fs->fs_minfree < 5 ||
                    291:                    fs->fs_cstotal.cs_nffree >
                    292:                    fs->fs_dsize * fs->fs_minfree / (2 * 100))
                    293:                        break;
                    294:                log(LOG_NOTICE, "%s: optimization changed from SPACE to TIME\n",
                    295:                        fs->fs_fsmnt);
                    296:                fs->fs_optim = FS_OPTTIME;
                    297:                break;
                    298:        case FS_OPTTIME:
                    299:                /*
                    300:                 * At this point we have discovered a file that is trying to
                    301:                 * grow a small fragment to a larger fragment. To save time,
                    302:                 * we allocate a full sized block, then free the unused portion.
                    303:                 * If the file continues to grow, the `ffs_fragextend' call
                    304:                 * above will be able to grow it in place without further
                    305:                 * copying. If aberrant programs cause disk fragmentation to
                    306:                 * grow within 2% of the free reserve, we choose to begin
                    307:                 * optimizing for space.
                    308:                 */
                    309:                request = fs->fs_bsize;
                    310:                if (fs->fs_cstotal.cs_nffree <
                    311:                    fs->fs_dsize * (fs->fs_minfree - 2) / 100)
                    312:                        break;
                    313:                log(LOG_NOTICE, "%s: optimization changed from TIME to SPACE\n",
                    314:                        fs->fs_fsmnt);
                    315:                fs->fs_optim = FS_OPTSPACE;
                    316:                break;
                    317:        default:
                    318:                printf("dev = 0x%x, optim = %d, fs = %s\n",
                    319:                    ip->i_dev, fs->fs_optim, fs->fs_fsmnt);
                    320:                panic("ffs_realloccg: bad optim");
                    321:                /* NOTREACHED */
                    322:        }
                    323:        bno = (ufs_daddr_t)ffs_hashalloc(ip, cg, (long)bpref, request,
                    324:            (u_int32_t (*)())ffs_alloccg);
                    325:        if (bno > 0) {
                    326:                bp->b_blkno = fsbtodb(fs, bno);
                    327: #if MACH
                    328:                if (ITOV(ip)->v_vm_info != 0)
                    329:                        (void) vnode_uncache(ITOV(ip));
                    330: #endif
                    331:                ffs_blkfree(ip, bprev, (long)osize);
                    332:                if (nsize < request)
                    333:                        ffs_blkfree(ip, bno + numfrags(fs, nsize),
                    334:                            (long)(request - nsize));
                    335: #ifdef NeXT
                    336:                ip->i_blocks += btodb(nsize - osize, devBlockSize);
                    337: #else
                    338:                ip->i_blocks += btodb(nsize - osize);
                    339: #endif /* NeXT */
                    340:                ip->i_flag |= IN_CHANGE | IN_UPDATE;
                    341:                allocbuf(bp, nsize);
                    342:                bp->b_flags |= B_DONE;
                    343:                bzero((char *)bp->b_data + osize, (u_int)nsize - osize);
                    344:                *bpp = bp;
                    345:                return (0);
                    346:        }
                    347: #if QUOTA
                    348:        /*
                    349:         * Restore user's disk quota because allocation failed.
                    350:         */
                    351: #ifdef NeXT
                    352:        (void) chkdq(ip, (long)-btodb(nsize - osize, devBlockSize), cred, FORCE);
                    353: #else
                    354:        (void) chkdq(ip, (long)-btodb(nsize - osize), cred, FORCE);
                    355: #endif /* NeXT */
                    356: #endif /* QUOTA */
                    357:        brelse(bp);
                    358: nospace:
                    359:        /*
                    360:         * no space available
                    361:         */
                    362:        ffs_fserr(fs, cred->cr_uid, "file system full");
                    363:        uprintf("\n%s: write failed, file system is full\n", fs->fs_fsmnt);
                    364:        return (ENOSPC);
                    365: }
                    366: 
                    367: /*
                    368:  * Reallocate a sequence of blocks into a contiguous sequence of blocks.
                    369:  *
                    370:  * The vnode and an array of buffer pointers for a range of sequential
                    371:  * logical blocks to be made contiguous is given. The allocator attempts
                    372:  * to find a range of sequential blocks starting as close as possible to
                    373:  * an fs_rotdelay offset from the end of the allocation for the logical
                    374:  * block immediately preceeding the current range. If successful, the
                    375:  * physical block numbers in the buffer pointers and in the inode are
                    376:  * changed to reflect the new allocation. If unsuccessful, the allocation
                    377:  * is left unchanged. The success in doing the reallocation is returned.
                    378:  * Note that the error return is not reflected back to the user. Rather
                    379:  * the previous block allocation will be used.
                    380:  */
                    381: int doasyncfree = 1;
                    382: int doreallocblks = 1;
                    383: int prtrealloc = 0;
                    384: 
                    385: int
                    386: ffs_reallocblks(ap)
                    387:        struct vop_reallocblks_args /* {
                    388:                struct vnode *a_vp;
                    389:                struct cluster_save *a_buflist;
                    390:        } */ *ap;
                    391: {
                    392:        struct fs *fs;
                    393:        struct inode *ip;
                    394:        struct vnode *vp;
                    395:        struct buf *sbp, *ebp;
                    396:        ufs_daddr_t *bap, *sbap, *ebap;
                    397:        struct cluster_save *buflist;
                    398:        ufs_daddr_t start_lbn, end_lbn, soff, eoff, newblk, blkno;
                    399:        struct indir start_ap[NIADDR + 1], end_ap[NIADDR + 1], *idp;
                    400:        int i, len, start_lvl, end_lvl, pref, ssize;
                    401: #if    REV_ENDIAN_FS
                    402:        int rev_endian=0;
                    403: #endif /* REV_ENDIAN_FS */
                    404: 
                    405:        if (doreallocblks == 0)
                    406:                return (ENOSPC);
                    407:        vp = ap->a_vp;
                    408: #if    REV_ENDIAN_FS
                    409:        rev_endian = vp->v_mount->mnt_flag & MNT_REVEND;
                    410: #endif /* REV_ENDIAN_FS */
                    411: 
                    412:        ip = VTOI(vp);
                    413:        fs = ip->i_fs;
                    414:        if (fs->fs_contigsumsize <= 0)
                    415:                return (ENOSPC);
                    416:        buflist = ap->a_buflist;
                    417:        len = buflist->bs_nchildren;
                    418:        start_lbn = buflist->bs_children[0]->b_lblkno;
                    419:        end_lbn = start_lbn + len - 1;
                    420: #if DIAGNOSTIC
                    421:        for (i = 0; i < len; i++)
                    422:                if (!ffs_checkblk(ip,
                    423:                   dbtofsb(fs, buflist->bs_children[i]->b_blkno), fs->fs_bsize))
                    424:                        panic("ffs_reallocblks: unallocated block 1");
                    425:        for (i = 1; i < len; i++)
                    426:                if (buflist->bs_children[i]->b_lblkno != start_lbn + i)
                    427:                        panic("ffs_reallocblks: non-logical cluster");
                    428:        blkno = buflist->bs_children[0]->b_blkno;
                    429:        ssize = fsbtodb(fs, fs->fs_frag);
                    430:        for (i = 1; i < len - 1; i++)
                    431:                if (buflist->bs_children[i]->b_blkno != blkno + (i * ssize))
                    432:                        panic("ffs_reallocblks: non-physical cluster %d", i);
                    433: #endif
                    434:        /*
                    435:         * If the latest allocation is in a new cylinder group, assume that
                    436:         * the filesystem has decided to move and do not force it back to
                    437:         * the previous cylinder group.
                    438:         */
                    439:        if (dtog(fs, dbtofsb(fs, buflist->bs_children[0]->b_blkno)) !=
                    440:            dtog(fs, dbtofsb(fs, buflist->bs_children[len - 1]->b_blkno)))
                    441:                return (ENOSPC);
                    442:        if (ufs_getlbns(vp, start_lbn, start_ap, &start_lvl) ||
                    443:            ufs_getlbns(vp, end_lbn, end_ap, &end_lvl))
                    444:                return (ENOSPC);
                    445:        /*
                    446:         * Get the starting offset and block map for the first block.
                    447:         */
                    448:        if (start_lvl == 0) {
                    449:                sbap = &ip->i_db[0];
                    450:                soff = start_lbn;
                    451:        } else {
                    452:                idp = &start_ap[start_lvl - 1];
                    453:                if (bread(vp, idp->in_lbn, (int)fs->fs_bsize, NOCRED, &sbp)) {
                    454:                        brelse(sbp);
                    455:                        return (ENOSPC);
                    456:                }
                    457:                sbap = (ufs_daddr_t *)sbp->b_data;
                    458:                soff = idp->in_off;
                    459:        }
                    460:        /*
                    461:         * Find the preferred location for the cluster.
                    462:         */
                    463:        pref = ffs_blkpref(ip, start_lbn, soff, sbap);
                    464:        /*
                    465:         * If the block range spans two block maps, get the second map.
                    466:         */
                    467:        if (end_lvl == 0 || (idp = &end_ap[end_lvl - 1])->in_off + 1 >= len) {
                    468:                ssize = len;
                    469:        } else {
                    470: #if DIAGNOSTIC
                    471:                if (start_lvl && start_ap[start_lvl-1].in_lbn == idp->in_lbn)
                    472:                        panic("ffs_reallocblk: start == end");
                    473: #endif
                    474:                ssize = len - (idp->in_off + 1);
                    475:                if (bread(vp, idp->in_lbn, (int)fs->fs_bsize, NOCRED, &ebp))
                    476:                        goto fail;
                    477:                ebap = (ufs_daddr_t *)ebp->b_data;
                    478:        }
                    479:        /*
                    480:         * Search the block map looking for an allocation of the desired size.
                    481:         */
                    482:        if ((newblk = (ufs_daddr_t)ffs_hashalloc(ip, dtog(fs, pref), (long)pref,
                    483:            len, (u_int32_t (*)())ffs_clusteralloc)) == 0)
                    484:                goto fail;
                    485:        /*
                    486:         * We have found a new contiguous block.
                    487:         *
                    488:         * First we have to replace the old block pointers with the new
                    489:         * block pointers in the inode and indirect blocks associated
                    490:         * with the file.
                    491:         */
                    492: #ifdef DEBUG
                    493:        if (prtrealloc)
                    494:                printf("realloc: ino %d, lbns %d-%d\n\told:", ip->i_number,
                    495:                    start_lbn, end_lbn);
                    496: #endif
                    497:        blkno = newblk;
                    498:        for (bap = &sbap[soff], i = 0; i < len; i++, blkno += fs->fs_frag) {
                    499:                if (i == ssize)
                    500:                        bap = ebap;
                    501: #if DIAGNOSTIC
                    502:                if (!ffs_checkblk(ip,
                    503:                   dbtofsb(fs, buflist->bs_children[i]->b_blkno), fs->fs_bsize))
                    504:                        panic("ffs_reallocblks: unallocated block 2");
                    505: #if REV_ENDIAN_FS
                    506:                if (rev_endian && !(bap >= &ip->i_db[0] && bap <= &ip->i_db[NDADDR-1])) {
                    507:                        if (dbtofsb(fs, buflist->bs_children[i]->b_blkno) != NXSwapLong(*bap))
                    508:                                panic("ffs_reallocblks: alloc mismatch");
                    509:                } else {
                    510: #endif /* REV_ENDIAN_FS */
                    511:                        if (dbtofsb(fs, buflist->bs_children[i]->b_blkno) != *bap)
                    512:                                panic("ffs_reallocblks: alloc mismatch");
                    513: #if REV_ENDIAN_FS
                    514:                }
                    515: #endif /* REV_ENDIAN_FS */
                    516: #endif
                    517: #ifdef DEBUG
                    518: #if REV_ENDIAN_FS
                    519:                if (rev_endian && !(bap >= &ip->i_db[0] && bap <= &ip->i_db[NDADDR-1])) {
                    520:                        if (prtrealloc)
                    521:                                printf(" %d,", NXSwapLong(*bap));
                    522:                }else {
                    523: #endif /* REV_ENDIAN_FS */
                    524:                        if (prtrealloc)
                    525:                                printf(" %d,", *bap);
                    526: #if REV_ENDIAN_FS
                    527:                }
                    528: #endif /* REV_ENDIAN_FS */
                    529: #endif
                    530: #if REV_ENDIAN_FS
                    531:                if (rev_endian && !(bap >= &ip->i_db[0] && bap <= &ip->i_db[NDADDR-1])) {
                    532:                        /* An indirect block need to swap as
                    533:                        *  it is going to be written out directly
                    534:                        */
                    535:                        *bap++ = NXSwapLong(blkno);
                    536:                }
                    537:                else {
                    538:                        /* Direct block; going to be written out
                    539:                        * by a VOP_UPDATE; which takes care of swapping 
                    540:                        */
                    541: #endif /* REV_ENDIAN_FS */
                    542:                        *bap++ = blkno;
                    543: #if REV_ENDIAN_FS
                    544:                }
                    545: #endif /* REV_ENDIAN_FS */
                    546: 
                    547:        }
                    548:        /*
                    549:         * Next we must write out the modified inode and indirect blocks.
                    550:         * For strict correctness, the writes should be synchronous since
                    551:         * the old block values may have been written to disk. In practise
                    552:         * they are almost never written, but if we are concerned about 
                    553:         * strict correctness, the `doasyncfree' flag should be set to zero.
                    554:         *
                    555:         * The test on `doasyncfree' should be changed to test a flag
                    556:         * that shows whether the associated buffers and inodes have
                    557:         * been written. The flag should be set when the cluster is
                    558:         * started and cleared whenever the buffer or inode is flushed.
                    559:         * We can then check below to see if it is set, and do the
                    560:         * synchronous write only when it has been cleared.
                    561:         */
                    562:        if (sbap != &ip->i_db[0]) {
                    563:                if (doasyncfree)
                    564:                        bdwrite(sbp);
                    565:                else
                    566:                        bwrite(sbp);
                    567:        } else {
                    568:                ip->i_flag |= IN_CHANGE | IN_UPDATE;
                    569:                if (!doasyncfree)
                    570:                        VOP_UPDATE(vp, &time, &time, MNT_WAIT);
                    571:        }
                    572:        if (ssize < len)
                    573:                if (doasyncfree)
                    574:                        bdwrite(ebp);
                    575:                else
                    576:                        bwrite(ebp);
                    577:        /*
                    578:         * Last, free the old blocks and assign the new blocks to the buffers.
                    579:         */
                    580: #ifdef DEBUG
                    581:        if (prtrealloc)
                    582:                printf("\n\tnew:");
                    583: #endif
                    584:        for (blkno = newblk, i = 0; i < len; i++, blkno += fs->fs_frag) {
                    585:                ffs_blkfree(ip, dbtofsb(fs, buflist->bs_children[i]->b_blkno),
                    586:                    fs->fs_bsize);
                    587:                buflist->bs_children[i]->b_blkno = fsbtodb(fs, blkno);
                    588: #if DIAGNOSTIC
                    589:                if (!ffs_checkblk(ip,
                    590:                   dbtofsb(fs, buflist->bs_children[i]->b_blkno), fs->fs_bsize))
                    591:                        panic("ffs_reallocblks: unallocated block 3");
                    592:                if (prtrealloc)
                    593:                        printf(" %d,", blkno);
                    594: #endif
                    595:        }
                    596: #ifdef DEBUG
                    597:        if (prtrealloc) {
                    598:                prtrealloc--;
                    599:                printf("\n");
                    600:        }
                    601: #endif
                    602:        return (0);
                    603: 
                    604: fail:
                    605:        if (ssize < len)
                    606:                brelse(ebp);
                    607:        if (sbap != &ip->i_db[0])
                    608:                brelse(sbp);
                    609:        return (ENOSPC);
                    610: }
                    611: 
                    612: /*
                    613:  * Allocate an inode in the file system.
                    614:  * 
                    615:  * If allocating a directory, use ffs_dirpref to select the inode.
                    616:  * If allocating in a directory, the following hierarchy is followed:
                    617:  *   1) allocate the preferred inode.
                    618:  *   2) allocate an inode in the same cylinder group.
                    619:  *   3) quadradically rehash into other cylinder groups, until an
                    620:  *      available inode is located.
                    621:  * If no inode preference is given the following heirarchy is used
                    622:  * to allocate an inode:
                    623:  *   1) allocate an inode in cylinder group 0.
                    624:  *   2) quadradically rehash into other cylinder groups, until an
                    625:  *      available inode is located.
                    626:  */
                    627: int
                    628: ffs_valloc(ap)
                    629:        struct vop_valloc_args /* {
                    630:                struct vnode *a_pvp;
                    631:                int a_mode;
                    632:                struct ucred *a_cred;
                    633:                struct vnode **a_vpp;
                    634:        } */ *ap;
                    635: {
                    636:        register struct vnode *pvp = ap->a_pvp;
                    637:        register struct inode *pip;
                    638:        register struct fs *fs;
                    639:        register struct inode *ip;
                    640:        mode_t mode = ap->a_mode;
                    641:        ino_t ino, ipref;
                    642:        int cg, error;
                    643:        
                    644:        *ap->a_vpp = NULL;
                    645:        pip = VTOI(pvp);
                    646:        fs = pip->i_fs;
                    647:        if (fs->fs_cstotal.cs_nifree == 0)
                    648:                goto noinodes;
                    649: 
                    650:        if ((mode & IFMT) == IFDIR)
                    651:                ipref = ffs_dirpref(fs);
                    652:        else
                    653:                ipref = pip->i_number;
                    654:        if (ipref >= fs->fs_ncg * fs->fs_ipg)
                    655:                ipref = 0;
                    656:        cg = ino_to_cg(fs, ipref);
                    657:        ino = (ino_t)ffs_hashalloc(pip, cg, (long)ipref, mode, ffs_nodealloccg);
                    658:        if (ino == 0)
                    659:                goto noinodes;
                    660:        error = VFS_VGET(pvp->v_mount, ino, ap->a_vpp);
                    661:        if (error) {
                    662:                VOP_VFREE(pvp, ino, mode);
                    663:                return (error);
                    664:        }
                    665:        ip = VTOI(*ap->a_vpp);
                    666:        if (ip->i_mode) {
                    667:                printf("mode = 0%o, inum = %d, fs = %s\n",
                    668:                    ip->i_mode, ip->i_number, fs->fs_fsmnt);
                    669:                panic("ffs_valloc: dup alloc");
                    670:        }
                    671:        if (ip->i_blocks) {                             /* XXX */
                    672:                printf("free inode %s/%d had %d blocks\n",
                    673:                    fs->fs_fsmnt, ino, ip->i_blocks);
                    674:                ip->i_blocks = 0;
                    675:        }
                    676:        ip->i_flags = 0;
                    677:        /*
                    678:         * Set up a new generation number for this inode.
                    679:         */
                    680:        if (++nextgennumber < (u_long)time.tv_sec)
                    681:                nextgennumber = time.tv_sec;
                    682:        ip->i_gen = nextgennumber;
                    683:        return (0);
                    684: noinodes:
                    685:        ffs_fserr(fs, ap->a_cred->cr_uid, "out of inodes");
                    686:        uprintf("\n%s: create/symlink failed, no inodes free\n", fs->fs_fsmnt);
                    687:        return (ENOSPC);
                    688: }
                    689: 
                    690: /*
                    691:  * Find a cylinder to place a directory.
                    692:  *
                    693:  * The policy implemented by this algorithm is to select from
                    694:  * among those cylinder groups with above the average number of
                    695:  * free inodes, the one with the smallest number of directories.
                    696:  */
                    697: static ino_t
                    698: ffs_dirpref(fs)
                    699:        register struct fs *fs;
                    700: {
                    701:        int cg, minndir, mincg, avgifree;
                    702: 
                    703:        avgifree = fs->fs_cstotal.cs_nifree / fs->fs_ncg;
                    704:        minndir = fs->fs_ipg;
                    705:        mincg = 0;
                    706:        for (cg = 0; cg < fs->fs_ncg; cg++)
                    707:                if (fs->fs_cs(fs, cg).cs_ndir < minndir &&
                    708:                    fs->fs_cs(fs, cg).cs_nifree >= avgifree) {
                    709:                        mincg = cg;
                    710:                        minndir = fs->fs_cs(fs, cg).cs_ndir;
                    711:                }
                    712:        return ((ino_t)(fs->fs_ipg * mincg));
                    713: }
                    714: 
                    715: /*
                    716:  * Select the desired position for the next block in a file.  The file is
                    717:  * logically divided into sections. The first section is composed of the
                    718:  * direct blocks. Each additional section contains fs_maxbpg blocks.
                    719:  * 
                    720:  * If no blocks have been allocated in the first section, the policy is to
                    721:  * request a block in the same cylinder group as the inode that describes
                    722:  * the file. If no blocks have been allocated in any other section, the
                    723:  * policy is to place the section in a cylinder group with a greater than
                    724:  * average number of free blocks.  An appropriate cylinder group is found
                    725:  * by using a rotor that sweeps the cylinder groups. When a new group of
                    726:  * blocks is needed, the sweep begins in the cylinder group following the
                    727:  * cylinder group from which the previous allocation was made. The sweep
                    728:  * continues until a cylinder group with greater than the average number
                    729:  * of free blocks is found. If the allocation is for the first block in an
                    730:  * indirect block, the information on the previous allocation is unavailable;
                    731:  * here a best guess is made based upon the logical block number being
                    732:  * allocated.
                    733:  * 
                    734:  * If a section is already partially allocated, the policy is to
                    735:  * contiguously allocate fs_maxcontig blocks.  The end of one of these
                    736:  * contiguous blocks and the beginning of the next is physically separated
                    737:  * so that the disk head will be in transit between them for at least
                    738:  * fs_rotdelay milliseconds.  This is to allow time for the processor to
                    739:  * schedule another I/O transfer.
                    740:  */
                    741: ufs_daddr_t
                    742: ffs_blkpref(ip, lbn, indx, bap)
                    743:        struct inode *ip;
                    744:        ufs_daddr_t lbn;
                    745:        int indx;
                    746:        ufs_daddr_t *bap;
                    747: {
                    748:        register struct fs *fs;
                    749:        register int cg;
                    750:        int avgbfree, startcg;
                    751:        ufs_daddr_t nextblk;
                    752: #if    REV_ENDIAN_FS
                    753:        daddr_t prev=0;
                    754:        struct vnode *vp=ITOV(ip);
                    755:        struct mount *mp=vp->v_mount;
                    756:        int rev_endian=(mp->mnt_flag & MNT_REVEND);
                    757: #endif /* REV_ENDIAN_FS */
                    758: 
                    759:        fs = ip->i_fs;
                    760: #if    REV_ENDIAN_FS
                    761:        if (indx && bap) {
                    762:        if (rev_endian) {
                    763:                if (bap != &ip->i_db[0])
                    764:                        prev = NXSwapLong(bap[indx - 1]);
                    765:                else
                    766:                        prev = bap[indx - 1];
                    767:        } else prev = bap[indx - 1];
                    768:        }
                    769:        if (indx % fs->fs_maxbpg == 0 || prev == 0)
                    770: #else  /* REV_ENDIAN_FS */
                    771:        if (indx % fs->fs_maxbpg == 0 || bap[indx - 1] == 0) 
                    772: #endif /* REV_ENDIAN_FS */
                    773:        {
                    774:                if (lbn < NDADDR) {
                    775:                        cg = ino_to_cg(fs, ip->i_number);
                    776:                        return (fs->fs_fpg * cg + fs->fs_frag);
                    777:                }
                    778:                /*
                    779:                 * Find a cylinder with greater than average number of
                    780:                 * unused data blocks.
                    781:                 */
                    782: #if    REV_ENDIAN_FS
                    783:                if (indx == 0 || prev == 0)
                    784: #else  /* REV_ENDIAN_FS */
                    785:                if (indx == 0 || bap[indx - 1] == 0)
                    786: #endif /* REV_ENDIAN_FS */
                    787:                        startcg =
                    788:                            ino_to_cg(fs, ip->i_number) + lbn / fs->fs_maxbpg;
                    789:                else
                    790: #if    REV_ENDIAN_FS
                    791:                        startcg = dtog(fs, prev) + 1;
                    792: #else  /* REV_ENDIAN_FS */
                    793:                        startcg = dtog(fs, bap[indx - 1]) + 1;
                    794: #endif /* REV_ENDIAN_FS */
                    795:                startcg %= fs->fs_ncg;
                    796:                avgbfree = fs->fs_cstotal.cs_nbfree / fs->fs_ncg;
                    797:                for (cg = startcg; cg < fs->fs_ncg; cg++)
                    798:                        if (fs->fs_cs(fs, cg).cs_nbfree >= avgbfree) {
                    799:                                fs->fs_cgrotor = cg;
                    800:                                return (fs->fs_fpg * cg + fs->fs_frag);
                    801:                        }
                    802:                for (cg = 0; cg <= startcg; cg++)
                    803:                        if (fs->fs_cs(fs, cg).cs_nbfree >= avgbfree) {
                    804:                                fs->fs_cgrotor = cg;
                    805:                                return (fs->fs_fpg * cg + fs->fs_frag);
                    806:                        }
                    807:                return (NULL);
                    808:        }
                    809:        /*
                    810:         * One or more previous blocks have been laid out. If less
                    811:         * than fs_maxcontig previous blocks are contiguous, the
                    812:         * next block is requested contiguously, otherwise it is
                    813:         * requested rotationally delayed by fs_rotdelay milliseconds.
                    814:         */
                    815: #if    REV_ENDIAN_FS
                    816:        if (rev_endian) {
                    817:                nextblk = prev + fs->fs_frag;
                    818:                if (indx < fs->fs_maxcontig) {
                    819:                        return (nextblk);
                    820:                }
                    821:                if (bap != &ip->i_db[0])
                    822:                        prev = NXSwapLong(bap[indx - fs->fs_maxcontig]);
                    823:                else
                    824:                        prev = bap[indx - fs->fs_maxcontig];
                    825:                if (prev + blkstofrags(fs, fs->fs_maxcontig) != nextblk)
                    826:                        return (nextblk);
                    827:        } else {
                    828: #endif /* REV_ENDIAN_FS */
                    829:        nextblk = bap[indx - 1] + fs->fs_frag;
                    830:        if (indx < fs->fs_maxcontig || bap[indx - fs->fs_maxcontig] +
                    831:            blkstofrags(fs, fs->fs_maxcontig) != nextblk)
                    832:                return (nextblk);
                    833: #if REV_ENDIAN_FS
                    834:        }
                    835: #endif /* REV_ENDIAN_FS */
                    836:        if (fs->fs_rotdelay != 0)
                    837:                /*
                    838:                 * Here we convert ms of delay to frags as:
                    839:                 * (frags) = (ms) * (rev/sec) * (sect/rev) /
                    840:                 *      ((sect/frag) * (ms/sec))
                    841:                 * then round up to the next block.
                    842:                 */
                    843:                nextblk += roundup(fs->fs_rotdelay * fs->fs_rps * fs->fs_nsect /
                    844:                    (NSPF(fs) * 1000), fs->fs_frag);
                    845:        return (nextblk);
                    846: }
                    847: 
                    848: /*
                    849:  * Implement the cylinder overflow algorithm.
                    850:  *
                    851:  * The policy implemented by this algorithm is:
                    852:  *   1) allocate the block in its requested cylinder group.
                    853:  *   2) quadradically rehash on the cylinder group number.
                    854:  *   3) brute force search for a free block.
                    855:  */
                    856: /*VARARGS5*/
                    857: static u_long
                    858: ffs_hashalloc(ip, cg, pref, size, allocator)
                    859:        struct inode *ip;
                    860:        int cg;
                    861:        long pref;
                    862:        int size;       /* size for data blocks, mode for inodes */
                    863:        u_int32_t (*allocator)();
                    864: {
                    865:        register struct fs *fs;
                    866:        long result;
                    867:        int i, icg = cg;
                    868: 
                    869:        fs = ip->i_fs;
                    870:        /*
                    871:         * 1: preferred cylinder group
                    872:         */
                    873:        result = (*allocator)(ip, cg, pref, size);
                    874:        if (result)
                    875:                return (result);
                    876:        /*
                    877:         * 2: quadratic rehash
                    878:         */
                    879:        for (i = 1; i < fs->fs_ncg; i *= 2) {
                    880:                cg += i;
                    881:                if (cg >= fs->fs_ncg)
                    882:                        cg -= fs->fs_ncg;
                    883:                result = (*allocator)(ip, cg, 0, size);
                    884:                if (result)
                    885:                        return (result);
                    886:        }
                    887:        /*
                    888:         * 3: brute force search
                    889:         * Note that we start at i == 2, since 0 was checked initially,
                    890:         * and 1 is always checked in the quadratic rehash.
                    891:         */
                    892:        cg = (icg + 2) % fs->fs_ncg;
                    893:        for (i = 2; i < fs->fs_ncg; i++) {
                    894:                result = (*allocator)(ip, cg, 0, size);
                    895:                if (result)
                    896:                        return (result);
                    897:                cg++;
                    898:                if (cg == fs->fs_ncg)
                    899:                        cg = 0;
                    900:        }
                    901:        return (NULL);
                    902: }
                    903: 
                    904: /*
                    905:  * Determine whether a fragment can be extended.
                    906:  *
                    907:  * Check to see if the necessary fragments are available, and 
                    908:  * if they are, allocate them.
                    909:  */
                    910: static ufs_daddr_t
                    911: ffs_fragextend(ip, cg, bprev, osize, nsize)
                    912:        struct inode *ip;
                    913:        int cg;
                    914:        long bprev;
                    915:        int osize, nsize;
                    916: {
                    917:        register struct fs *fs;
                    918:        register struct cg *cgp;
                    919:        struct buf *bp;
                    920:        long bno;
                    921:        int frags, bbase;
                    922:        int i, error;
                    923: #if REV_ENDIAN_FS
                    924:        struct vnode *vp=ITOV(ip);
                    925:        struct mount *mp=vp->v_mount;
                    926:        int rev_endian=(mp->mnt_flag & MNT_REVEND);
                    927: #endif /* REV_ENDIAN_FS */
                    928: 
                    929:        fs = ip->i_fs;
                    930:        if (fs->fs_cs(fs, cg).cs_nffree < numfrags(fs, nsize - osize))
                    931:                return (NULL);
                    932:        frags = numfrags(fs, nsize);
                    933:        bbase = fragnum(fs, bprev);
                    934:        if (bbase > fragnum(fs, (bprev + frags - 1))) {
                    935:                /* cannot extend across a block boundary */
                    936:                return (NULL);
                    937:        }
                    938:        error = bread(ip->i_devvp, fsbtodb(fs, cgtod(fs, cg)),
                    939:                (int)fs->fs_cgsize, NOCRED, &bp);
                    940:        if (error) {
                    941:                brelse(bp);
                    942:                return (NULL);
                    943:        }
                    944:        cgp = (struct cg *)bp->b_data;
                    945: #if REV_ENDIAN_FS
                    946:        if (rev_endian) {
                    947:                byte_swap_cgin(cgp, fs);
                    948:        }
                    949: #endif /* REV_ENDIAN_FS */
                    950: 
                    951:        if (!cg_chkmagic(cgp)) {
                    952: #if REV_ENDIAN_FS
                    953:                if (rev_endian)
                    954:                        byte_swap_cgout(cgp,fs);
                    955: #endif /* REV_ENDIAN_FS */
                    956:                brelse(bp);
                    957:                return (NULL);
                    958:        }
                    959:        cgp->cg_time = time.tv_sec;
                    960:        bno = dtogd(fs, bprev);
                    961:        for (i = numfrags(fs, osize); i < frags; i++)
                    962:                if (isclr(cg_blksfree(cgp), bno + i)) {
                    963: #if REV_ENDIAN_FS
                    964:                        if (rev_endian)
                    965:                                byte_swap_cgout(cgp,fs);
                    966: #endif /* REV_ENDIAN_FS */
                    967:                        brelse(bp);
                    968:                        return (NULL);
                    969:                }
                    970:        /*
                    971:         * the current fragment can be extended
                    972:         * deduct the count on fragment being extended into
                    973:         * increase the count on the remaining fragment (if any)
                    974:         * allocate the extended piece
                    975:         */
                    976:        for (i = frags; i < fs->fs_frag - bbase; i++)
                    977:                if (isclr(cg_blksfree(cgp), bno + i))
                    978:                        break;
                    979:        cgp->cg_frsum[i - numfrags(fs, osize)]--;
                    980:        if (i != frags)
                    981:                cgp->cg_frsum[i - frags]++;
                    982:        for (i = numfrags(fs, osize); i < frags; i++) {
                    983:                clrbit(cg_blksfree(cgp), bno + i);
                    984:                cgp->cg_cs.cs_nffree--;
                    985:                fs->fs_cstotal.cs_nffree--;
                    986:                fs->fs_cs(fs, cg).cs_nffree--;
                    987:        }
                    988:        fs->fs_fmod = 1;
                    989: #if REV_ENDIAN_FS
                    990:        if (rev_endian)
                    991:                byte_swap_cgout(cgp,fs);
                    992: #endif /* REV_ENDIAN_FS */
                    993:        bdwrite(bp);
                    994:        return (bprev);
                    995: }
                    996: 
                    997: /*
                    998:  * Determine whether a block can be allocated.
                    999:  *
                   1000:  * Check to see if a block of the appropriate size is available,
                   1001:  * and if it is, allocate it.
                   1002:  */
                   1003: static ufs_daddr_t
                   1004: ffs_alloccg(ip, cg, bpref, size)
                   1005:        struct inode *ip;
                   1006:        int cg;
                   1007:        ufs_daddr_t bpref;
                   1008:        int size;
                   1009: {
                   1010:        register struct fs *fs;
                   1011:        register struct cg *cgp;
                   1012:        struct buf *bp;
                   1013:        register int i;
                   1014:        int error, bno, frags, allocsiz;
                   1015: #if REV_ENDIAN_FS
                   1016:        struct vnode *vp=ITOV(ip);
                   1017:        struct mount *mp=vp->v_mount;
                   1018:        int rev_endian=(mp->mnt_flag & MNT_REVEND);
                   1019: #endif /* REV_ENDIAN_FS */
                   1020: 
                   1021:        fs = ip->i_fs;
                   1022:        if (fs->fs_cs(fs, cg).cs_nbfree == 0 && size == fs->fs_bsize)
                   1023:                return (NULL);
                   1024:        error = bread(ip->i_devvp, fsbtodb(fs, cgtod(fs, cg)),
                   1025:                (int)fs->fs_cgsize, NOCRED, &bp);
                   1026:        if (error) {
                   1027:                brelse(bp);
                   1028:                return (NULL);
                   1029:        }
                   1030:        cgp = (struct cg *)bp->b_data;
                   1031: #if REV_ENDIAN_FS
                   1032:        if (rev_endian)
                   1033:                byte_swap_cgin(cgp,fs);
                   1034: #endif /* REV_ENDIAN_FS */
                   1035:        if (!cg_chkmagic(cgp) ||
                   1036:            (cgp->cg_cs.cs_nbfree == 0 && size == fs->fs_bsize)) {
                   1037: #if REV_ENDIAN_FS
                   1038:                if (rev_endian)
                   1039:                        byte_swap_cgout(cgp,fs);
                   1040: #endif /* REV_ENDIAN_FS */
                   1041:                brelse(bp);
                   1042:                return (NULL);
                   1043:        }
                   1044:        cgp->cg_time = time.tv_sec;
                   1045:        if (size == fs->fs_bsize) {
                   1046:                bno = ffs_alloccgblk(fs, cgp, bpref);
                   1047: #if REV_ENDIAN_FS
                   1048:                if (rev_endian)
                   1049:                        byte_swap_cgout(cgp,fs);
                   1050: #endif /* REV_ENDIAN_FS */
                   1051:                bdwrite(bp);
                   1052:                return (bno);
                   1053:        }
                   1054:        /*
                   1055:         * check to see if any fragments are already available
                   1056:         * allocsiz is the size which will be allocated, hacking
                   1057:         * it down to a smaller size if necessary
                   1058:         */
                   1059:        frags = numfrags(fs, size);
                   1060:        for (allocsiz = frags; allocsiz < fs->fs_frag; allocsiz++)
                   1061:                if (cgp->cg_frsum[allocsiz] != 0)
                   1062:                        break;
                   1063:        if (allocsiz == fs->fs_frag) {
                   1064:                /*
                   1065:                 * no fragments were available, so a block will be 
                   1066:                 * allocated, and hacked up
                   1067:                 */
                   1068:                if (cgp->cg_cs.cs_nbfree == 0) {
                   1069: #if    REV_ENDIAN_FS
                   1070:                        if (rev_endian)
                   1071:                                byte_swap_cgout(cgp,fs);
                   1072: #endif /* REV_ENDIAN_FS */
                   1073:                        brelse(bp);
                   1074:                        return (NULL);
                   1075:                }
                   1076:                bno = ffs_alloccgblk(fs, cgp, bpref);
                   1077:                bpref = dtogd(fs, bno);
                   1078:                for (i = frags; i < fs->fs_frag; i++)
                   1079:                        setbit(cg_blksfree(cgp), bpref + i);
                   1080:                i = fs->fs_frag - frags;
                   1081:                cgp->cg_cs.cs_nffree += i;
                   1082:                fs->fs_cstotal.cs_nffree += i;
                   1083:                fs->fs_cs(fs, cg).cs_nffree += i;
                   1084:                fs->fs_fmod = 1;
                   1085:                cgp->cg_frsum[i]++;
                   1086: #if    REV_ENDIAN_FS
                   1087:                if (rev_endian)
                   1088:                        byte_swap_cgout(cgp,fs);
                   1089: #endif /* REV_ENDIAN_FS */
                   1090:                bdwrite(bp);
                   1091:                return (bno);
                   1092:        }
                   1093:        bno = ffs_mapsearch(fs, cgp, bpref, allocsiz);
                   1094:        if (bno < 0) {
                   1095: #if    REV_ENDIAN_FS
                   1096:                if (rev_endian)
                   1097:                        byte_swap_cgout(cgp,fs);
                   1098: #endif /* REV_ENDIAN_FS */
                   1099:                brelse(bp);
                   1100:                return (NULL);
                   1101:        }
                   1102:        for (i = 0; i < frags; i++)
                   1103:                clrbit(cg_blksfree(cgp), bno + i);
                   1104:        cgp->cg_cs.cs_nffree -= frags;
                   1105:        fs->fs_cstotal.cs_nffree -= frags;
                   1106:        fs->fs_cs(fs, cg).cs_nffree -= frags;
                   1107:        fs->fs_fmod = 1;
                   1108:        cgp->cg_frsum[allocsiz]--;
                   1109:        if (frags != allocsiz)
                   1110:                cgp->cg_frsum[allocsiz - frags]++;
                   1111: #if    REV_ENDIAN_FS
                   1112:        if (rev_endian)
                   1113:                byte_swap_cgout(cgp,fs);
                   1114: #endif /* REV_ENDIAN_FS */
                   1115:        bdwrite(bp);
                   1116:        return (cg * fs->fs_fpg + bno);
                   1117: }
                   1118: 
                   1119: /*
                   1120:  * Allocate a block in a cylinder group.
                   1121:  *
                   1122:  * This algorithm implements the following policy:
                   1123:  *   1) allocate the requested block.
                   1124:  *   2) allocate a rotationally optimal block in the same cylinder.
                   1125:  *   3) allocate the next available block on the block rotor for the
                   1126:  *      specified cylinder group.
                   1127:  * Note that this routine only allocates fs_bsize blocks; these
                   1128:  * blocks may be fragmented by the routine that allocates them.
                   1129:  */
                   1130: static ufs_daddr_t
                   1131: ffs_alloccgblk(fs, cgp, bpref)
                   1132:        register struct fs *fs;
                   1133:        register struct cg *cgp;
                   1134:        ufs_daddr_t bpref;
                   1135: {
                   1136:        ufs_daddr_t bno, blkno;
                   1137:        int cylno, pos, delta;
                   1138:        short *cylbp;
                   1139:        register int i;
                   1140: 
                   1141:        if (bpref == 0 || dtog(fs, bpref) != cgp->cg_cgx) {
                   1142:                bpref = cgp->cg_rotor;
                   1143:                goto norot;
                   1144:        }
                   1145:        bpref = blknum(fs, bpref);
                   1146:        bpref = dtogd(fs, bpref);
                   1147:        /*
                   1148:         * if the requested block is available, use it
                   1149:         */
                   1150:        if (ffs_isblock(fs, cg_blksfree(cgp), fragstoblks(fs, bpref))) {
                   1151:                bno = bpref;
                   1152:                goto gotit;
                   1153:        }
                   1154:        if (fs->fs_nrpos <= 1 || fs->fs_cpc == 0) {
                   1155:                /*
                   1156:                 * Block layout information is not available.
                   1157:                 * Leaving bpref unchanged means we take the
                   1158:                 * next available free block following the one 
                   1159:                 * we just allocated. Hopefully this will at
                   1160:                 * least hit a track cache on drives of unknown
                   1161:                 * geometry (e.g. SCSI).
                   1162:                 */
                   1163:                goto norot;
                   1164:        }
                   1165:        /*
                   1166:         * check for a block available on the same cylinder
                   1167:         */
                   1168:        cylno = cbtocylno(fs, bpref);
                   1169:        if (cg_blktot(cgp)[cylno] == 0)
                   1170:                goto norot;
                   1171:        /*
                   1172:         * check the summary information to see if a block is 
                   1173:         * available in the requested cylinder starting at the
                   1174:         * requested rotational position and proceeding around.
                   1175:         */
                   1176:        cylbp = cg_blks(fs, cgp, cylno);
                   1177:        pos = cbtorpos(fs, bpref);
                   1178:        for (i = pos; i < fs->fs_nrpos; i++)
                   1179:                if (cylbp[i] > 0)
                   1180:                        break;
                   1181:        if (i == fs->fs_nrpos)
                   1182:                for (i = 0; i < pos; i++)
                   1183:                        if (cylbp[i] > 0)
                   1184:                                break;
                   1185:        if (cylbp[i] > 0) {
                   1186:                /*
                   1187:                 * found a rotational position, now find the actual
                   1188:                 * block. A panic if none is actually there.
                   1189:                 */
                   1190:                pos = cylno % fs->fs_cpc;
                   1191:                bno = (cylno - pos) * fs->fs_spc / NSPB(fs);
                   1192:                if (fs_postbl(fs, pos)[i] == -1) {
                   1193:                        printf("pos = %d, i = %d, fs = %s\n",
                   1194:                            pos, i, fs->fs_fsmnt);
                   1195:                        panic("ffs_alloccgblk: cyl groups corrupted");
                   1196:                }
                   1197:                for (i = fs_postbl(fs, pos)[i];; ) {
                   1198:                        if (ffs_isblock(fs, cg_blksfree(cgp), bno + i)) {
                   1199:                                bno = blkstofrags(fs, (bno + i));
                   1200:                                goto gotit;
                   1201:                        }
                   1202:                        delta = fs_rotbl(fs)[i];
                   1203:                        if (delta <= 0 ||
                   1204:                            delta + i > fragstoblks(fs, fs->fs_fpg))
                   1205:                                break;
                   1206:                        i += delta;
                   1207:                }
                   1208:                printf("pos = %d, i = %d, fs = %s\n", pos, i, fs->fs_fsmnt);
                   1209:                panic("ffs_alloccgblk: can't find blk in cyl");
                   1210:        }
                   1211: norot:
                   1212:        /*
                   1213:         * no blocks in the requested cylinder, so take next
                   1214:         * available one in this cylinder group.
                   1215:         */
                   1216:        bno = ffs_mapsearch(fs, cgp, bpref, (int)fs->fs_frag);
                   1217:        if (bno < 0)
                   1218:                return (NULL);
                   1219:        cgp->cg_rotor = bno;
                   1220: gotit:
                   1221:        blkno = fragstoblks(fs, bno);
                   1222:        ffs_clrblock(fs, cg_blksfree(cgp), (long)blkno);
                   1223:        ffs_clusteracct(fs, cgp, blkno, -1);
                   1224:        cgp->cg_cs.cs_nbfree--;
                   1225:        fs->fs_cstotal.cs_nbfree--;
                   1226:        fs->fs_cs(fs, cgp->cg_cgx).cs_nbfree--;
                   1227:        cylno = cbtocylno(fs, bno);
                   1228:        cg_blks(fs, cgp, cylno)[cbtorpos(fs, bno)]--;
                   1229:        cg_blktot(cgp)[cylno]--;
                   1230:        fs->fs_fmod = 1;
                   1231:        return (cgp->cg_cgx * fs->fs_fpg + bno);
                   1232: }
                   1233: 
                   1234: /*
                   1235:  * Determine whether a cluster can be allocated.
                   1236:  *
                   1237:  * We do not currently check for optimal rotational layout if there
                   1238:  * are multiple choices in the same cylinder group. Instead we just
                   1239:  * take the first one that we find following bpref.
                   1240:  */
                   1241: static ufs_daddr_t
                   1242: ffs_clusteralloc(ip, cg, bpref, len)
                   1243:        struct inode *ip;
                   1244:        int cg;
                   1245:        ufs_daddr_t bpref;
                   1246:        int len;
                   1247: {
                   1248:        register struct fs *fs;
                   1249:        register struct cg *cgp;
                   1250:        struct buf *bp;
                   1251:        int i, got, run, bno, bit, map;
                   1252:        u_char *mapp;
                   1253:        int32_t *lp;
                   1254: #if REV_ENDIAN_FS
                   1255:        struct vnode *vp=ITOV(ip);
                   1256:        struct mount *mp=vp->v_mount;
                   1257:        int rev_endian=(mp->mnt_flag & MNT_REVEND);
                   1258: #endif /* REV_ENDIAN_FS */
                   1259: 
                   1260:        fs = ip->i_fs;
                   1261:        if (fs->fs_maxcluster[cg] < len)
                   1262:                return (NULL);
                   1263:        if (bread(ip->i_devvp, fsbtodb(fs, cgtod(fs, cg)), (int)fs->fs_cgsize,
                   1264:            NOCRED, &bp))
                   1265:                goto fail;
                   1266:        cgp = (struct cg *)bp->b_data;
                   1267: #if    REV_ENDIAN_FS
                   1268:        if (rev_endian)
                   1269:                byte_swap_cgin(cgp,fs);
                   1270: #endif /* REV_ENDIAN_FS */
                   1271:        if (!cg_chkmagic(cgp)) {
                   1272: #if    REV_ENDIAN_FS
                   1273:                if (rev_endian)
                   1274:                        byte_swap_cgout(cgp,fs);
                   1275: #endif /* REV_ENDIAN_FS */
                   1276:                goto fail;
                   1277:        }
                   1278:        /*
                   1279:         * Check to see if a cluster of the needed size (or bigger) is
                   1280:         * available in this cylinder group.
                   1281:         */
                   1282:        lp = &cg_clustersum(cgp)[len];
                   1283:        for (i = len; i <= fs->fs_contigsumsize; i++)
                   1284:                if (*lp++ > 0)
                   1285:                        break;
                   1286:        if (i > fs->fs_contigsumsize) {
                   1287:                /*
                   1288:                 * This is the first time looking for a cluster in this
                   1289:                 * cylinder group. Update the cluster summary information
                   1290:                 * to reflect the true maximum sized cluster so that
                   1291:                 * future cluster allocation requests can avoid reading
                   1292:                 * the cylinder group map only to find no clusters.
                   1293:                 */
                   1294:                lp = &cg_clustersum(cgp)[len - 1];
                   1295:                for (i = len - 1; i > 0; i--)
                   1296:                        if (*lp-- > 0)
                   1297:                                break;
                   1298:                fs->fs_maxcluster[cg] = i;
                   1299: #if    REV_ENDIAN_FS
                   1300:                if (rev_endian)
                   1301:                        byte_swap_cgout(cgp,fs);
                   1302: #endif /* REV_ENDIAN_FS */
                   1303:                goto fail;
                   1304:        }
                   1305:        /*
                   1306:         * Search the cluster map to find a big enough cluster.
                   1307:         * We take the first one that we find, even if it is larger
                   1308:         * than we need as we prefer to get one close to the previous
                   1309:         * block allocation. We do not search before the current
                   1310:         * preference point as we do not want to allocate a block
                   1311:         * that is allocated before the previous one (as we will
                   1312:         * then have to wait for another pass of the elevator
                   1313:         * algorithm before it will be read). We prefer to fail and
                   1314:         * be recalled to try an allocation in the next cylinder group.
                   1315:         */
                   1316:        if (dtog(fs, bpref) != cg)
                   1317:                bpref = 0;
                   1318:        else
                   1319:                bpref = fragstoblks(fs, dtogd(fs, blknum(fs, bpref)));
                   1320:        mapp = &cg_clustersfree(cgp)[bpref / NBBY];
                   1321:        map = *mapp++;
                   1322:        bit = 1 << (bpref % NBBY);
                   1323:        for (run = 0, got = bpref; got < cgp->cg_nclusterblks; got++) {
                   1324:                if ((map & bit) == 0) {
                   1325:                        run = 0;
                   1326:                } else {
                   1327:                        run++;
                   1328:                        if (run == len)
                   1329:                                break;
                   1330:                }
                   1331:                if ((got & (NBBY - 1)) != (NBBY - 1)) {
                   1332:                        bit <<= 1;
                   1333:                } else {
                   1334:                        map = *mapp++;
                   1335:                        bit = 1;
                   1336:                }
                   1337:        }
                   1338:        if (got == cgp->cg_nclusterblks) {
                   1339: #if    REV_ENDIAN_FS
                   1340:                if (rev_endian)
                   1341:                        byte_swap_cgout(cgp,fs);
                   1342: #endif /* REV_ENDIAN_FS */
                   1343:                goto fail;
                   1344:        }
                   1345:        /*
                   1346:         * Allocate the cluster that we have found.
                   1347:         */
                   1348:        for (i = 1; i <= len; i++)
                   1349:                if (!ffs_isblock(fs, cg_blksfree(cgp), got - run + i))
                   1350:                        panic("ffs_clusteralloc: map mismatch");
                   1351:        bno = cg * fs->fs_fpg + blkstofrags(fs, got - run + 1);
                   1352:        if (dtog(fs, bno) != cg)
                   1353:                panic("ffs_clusteralloc: allocated out of group");
                   1354:        len = blkstofrags(fs, len);
                   1355:        for (i = 0; i < len; i += fs->fs_frag)
                   1356:                if ((got = ffs_alloccgblk(fs, cgp, bno + i)) != bno + i)
                   1357:                        panic("ffs_clusteralloc: lost block");
                   1358: #if    REV_ENDIAN_FS
                   1359:        if (rev_endian)
                   1360:                byte_swap_cgout(cgp,fs);
                   1361: #endif /* REV_ENDIAN_FS */
                   1362:        bdwrite(bp);
                   1363:        return (bno);
                   1364: 
                   1365: fail:
                   1366:        brelse(bp);
                   1367:        return (0);
                   1368: }
                   1369: 
                   1370: /*
                   1371:  * Determine whether an inode can be allocated.
                   1372:  *
                   1373:  * Check to see if an inode is available, and if it is,
                   1374:  * allocate it using the following policy:
                   1375:  *   1) allocate the requested inode.
                   1376:  *   2) allocate the next available inode after the requested
                   1377:  *      inode in the specified cylinder group.
                   1378:  */
                   1379: static ino_t
                   1380: ffs_nodealloccg(ip, cg, ipref, mode)
                   1381:        struct inode *ip;
                   1382:        int cg;
                   1383:        ufs_daddr_t ipref;
                   1384:        int mode;
                   1385: {
                   1386:        register struct fs *fs;
                   1387:        register struct cg *cgp;
                   1388:        struct buf *bp;
                   1389:        int error, start, len, loc, map, i;
                   1390: #if REV_ENDIAN_FS
                   1391:        struct vnode *vp=ITOV(ip);
                   1392:        struct mount *mp=vp->v_mount;
                   1393:        int rev_endian=(mp->mnt_flag & MNT_REVEND);
                   1394: #endif /* REV_ENDIAN_FS */
                   1395: 
                   1396:        fs = ip->i_fs;
                   1397:        if (fs->fs_cs(fs, cg).cs_nifree == 0)
                   1398:                return (NULL);
                   1399:        error = bread(ip->i_devvp, fsbtodb(fs, cgtod(fs, cg)),
                   1400:                (int)fs->fs_cgsize, NOCRED, &bp);
                   1401:        if (error) {
                   1402:                brelse(bp);
                   1403:                return (NULL);
                   1404:        }
                   1405:        cgp = (struct cg *)bp->b_data;
                   1406: #if REV_ENDIAN_FS
                   1407:        if (rev_endian)
                   1408:                byte_swap_cgin(cgp,fs);
                   1409: #endif /* REV_ENDIAN_FS */
                   1410:        if (!cg_chkmagic(cgp) || cgp->cg_cs.cs_nifree == 0) {
                   1411: #if REV_ENDIAN_FS
                   1412:                if (rev_endian)
                   1413:                        byte_swap_cgout(cgp,fs);
                   1414: #endif /* REV_ENDIAN_FS */
                   1415:                brelse(bp);
                   1416:                return (NULL);
                   1417:        }
                   1418: 
                   1419:        cgp->cg_time = time.tv_sec;
                   1420:        if (ipref) {
                   1421:                ipref %= fs->fs_ipg;
                   1422:                if (isclr(cg_inosused(cgp), ipref))
                   1423:                        goto gotit;
                   1424:        }
                   1425:        start = cgp->cg_irotor / NBBY;
                   1426:        len = howmany(fs->fs_ipg - cgp->cg_irotor, NBBY);
                   1427:        loc = skpc(0xff, len, &cg_inosused(cgp)[start]);
                   1428:        if (loc == 0) {
                   1429:                len = start + 1;
                   1430:                start = 0;
                   1431:                loc = skpc(0xff, len, &cg_inosused(cgp)[0]);
                   1432:                if (loc == 0) {
                   1433:                        printf("cg = %d, irotor = %d, fs = %s\n",
                   1434:                            cg, cgp->cg_irotor, fs->fs_fsmnt);
                   1435:                        panic("ffs_nodealloccg: map corrupted");
                   1436:                        /* NOTREACHED */
                   1437:                }
                   1438:        }
                   1439:        i = start + len - loc;
                   1440:        map = cg_inosused(cgp)[i];
                   1441:        ipref = i * NBBY;
                   1442:        for (i = 1; i < (1 << NBBY); i <<= 1, ipref++) {
                   1443:                if ((map & i) == 0) {
                   1444:                        cgp->cg_irotor = ipref;
                   1445:                        goto gotit;
                   1446:                }
                   1447:        }
                   1448:        printf("fs = %s\n", fs->fs_fsmnt);
                   1449:        panic("ffs_nodealloccg: block not in map");
                   1450:        /* NOTREACHED */
                   1451: gotit:
                   1452:        setbit(cg_inosused(cgp), ipref);
                   1453:        cgp->cg_cs.cs_nifree--;
                   1454:        fs->fs_cstotal.cs_nifree--;
                   1455:        fs->fs_cs(fs, cg).cs_nifree--;
                   1456:        fs->fs_fmod = 1;
                   1457:        if ((mode & IFMT) == IFDIR) {
                   1458:                cgp->cg_cs.cs_ndir++;
                   1459:                fs->fs_cstotal.cs_ndir++;
                   1460:                fs->fs_cs(fs, cg).cs_ndir++;
                   1461:        }
                   1462: #if REV_ENDIAN_FS
                   1463:        if (rev_endian)
                   1464:                byte_swap_cgout(cgp,fs);
                   1465: #endif /* REV_ENDIAN_FS */
                   1466:        bdwrite(bp);
                   1467:        return (cg * fs->fs_ipg + ipref);
                   1468: }
                   1469: 
                   1470: /*
                   1471:  * Free a block or fragment.
                   1472:  *
                   1473:  * The specified block or fragment is placed back in the
                   1474:  * free map. If a fragment is deallocated, a possible 
                   1475:  * block reassembly is checked.
                   1476:  */
                   1477: ffs_blkfree(ip, bno, size)
                   1478:        register struct inode *ip;
                   1479:        ufs_daddr_t bno;
                   1480:        long size;
                   1481: {
                   1482:        register struct fs *fs;
                   1483:        register struct cg *cgp;
                   1484:        struct buf *bp;
                   1485:        ufs_daddr_t blkno;
                   1486:        int i, error, cg, blk, frags, bbase;
                   1487: #if REV_ENDIAN_FS
                   1488:        struct vnode *vp=ITOV(ip);
                   1489:        struct mount *mp=vp->v_mount;
                   1490:        int rev_endian=(mp->mnt_flag & MNT_REVEND);
                   1491: #endif /* REV_ENDIAN_FS */
                   1492:        fs = ip->i_fs;
                   1493:        if ((u_int)size > fs->fs_bsize || fragoff(fs, size) != 0) {
                   1494:                printf("dev = 0x%x, bsize = %d, size = %d, fs = %s\n",
                   1495:                    ip->i_dev, fs->fs_bsize, size, fs->fs_fsmnt);
                   1496:                panic("blkfree: bad size");
                   1497:        }
                   1498:        cg = dtog(fs, bno);
                   1499:        if ((u_int)bno >= fs->fs_size) {
                   1500:                printf("bad block %d, ino %d\n", bno, ip->i_number);
                   1501:                ffs_fserr(fs, ip->i_uid, "bad block");
                   1502:                return;
                   1503:        }
                   1504:        error = bread(ip->i_devvp, fsbtodb(fs, cgtod(fs, cg)),
                   1505:                (int)fs->fs_cgsize, NOCRED, &bp);
                   1506:        if (error) {
                   1507:                brelse(bp);
                   1508:                return;
                   1509:        }
                   1510:        cgp = (struct cg *)bp->b_data;
                   1511: #if REV_ENDIAN_FS
                   1512:        if (rev_endian)
                   1513:                byte_swap_cgin(cgp,fs);
                   1514: #endif /* REV_ENDIAN_FS */
                   1515:        if (!cg_chkmagic(cgp)) {
                   1516: #if REV_ENDIAN_FS
                   1517:                if (rev_endian)
                   1518:                        byte_swap_cgout(cgp,fs);
                   1519: #endif /* REV_ENDIAN_FS */
                   1520:                brelse(bp);
                   1521:                return;
                   1522:        }
                   1523:        cgp->cg_time = time.tv_sec;
                   1524:        bno = dtogd(fs, bno);
                   1525:        if (size == fs->fs_bsize) {
                   1526:                blkno = fragstoblks(fs, bno);
                   1527:                if (ffs_isblock(fs, cg_blksfree(cgp), blkno)) {
                   1528:                        printf("dev = 0x%x, block = %d, fs = %s\n",
                   1529:                            ip->i_dev, bno, fs->fs_fsmnt);
                   1530:                        panic("blkfree: freeing free block");
                   1531:                }
                   1532:                ffs_setblock(fs, cg_blksfree(cgp), blkno);
                   1533:                ffs_clusteracct(fs, cgp, blkno, 1);
                   1534:                cgp->cg_cs.cs_nbfree++;
                   1535:                fs->fs_cstotal.cs_nbfree++;
                   1536:                fs->fs_cs(fs, cg).cs_nbfree++;
                   1537:                i = cbtocylno(fs, bno);
                   1538:                cg_blks(fs, cgp, i)[cbtorpos(fs, bno)]++;
                   1539:                cg_blktot(cgp)[i]++;
                   1540:        } else {
                   1541:                bbase = bno - fragnum(fs, bno);
                   1542:                /*
                   1543:                 * decrement the counts associated with the old frags
                   1544:                 */
                   1545:                blk = blkmap(fs, cg_blksfree(cgp), bbase);
                   1546:                ffs_fragacct(fs, blk, cgp->cg_frsum, -1);
                   1547:                /*
                   1548:                 * deallocate the fragment
                   1549:                 */
                   1550:                frags = numfrags(fs, size);
                   1551:                for (i = 0; i < frags; i++) {
                   1552:                        if (isset(cg_blksfree(cgp), bno + i)) {
                   1553:                                printf("dev = 0x%x, block = %d, fs = %s\n",
                   1554:                                    ip->i_dev, bno + i, fs->fs_fsmnt);
                   1555:                                panic("blkfree: freeing free frag");
                   1556:                        }
                   1557:                        setbit(cg_blksfree(cgp), bno + i);
                   1558:                }
                   1559:                cgp->cg_cs.cs_nffree += i;
                   1560:                fs->fs_cstotal.cs_nffree += i;
                   1561:                fs->fs_cs(fs, cg).cs_nffree += i;
                   1562:                /*
                   1563:                 * add back in counts associated with the new frags
                   1564:                 */
                   1565:                blk = blkmap(fs, cg_blksfree(cgp), bbase);
                   1566:                ffs_fragacct(fs, blk, cgp->cg_frsum, 1);
                   1567:                /*
                   1568:                 * if a complete block has been reassembled, account for it
                   1569:                 */
                   1570:                blkno = fragstoblks(fs, bbase);
                   1571:                if (ffs_isblock(fs, cg_blksfree(cgp), blkno)) {
                   1572:                        cgp->cg_cs.cs_nffree -= fs->fs_frag;
                   1573:                        fs->fs_cstotal.cs_nffree -= fs->fs_frag;
                   1574:                        fs->fs_cs(fs, cg).cs_nffree -= fs->fs_frag;
                   1575:                        ffs_clusteracct(fs, cgp, blkno, 1);
                   1576:                        cgp->cg_cs.cs_nbfree++;
                   1577:                        fs->fs_cstotal.cs_nbfree++;
                   1578:                        fs->fs_cs(fs, cg).cs_nbfree++;
                   1579:                        i = cbtocylno(fs, bbase);
                   1580:                        cg_blks(fs, cgp, i)[cbtorpos(fs, bbase)]++;
                   1581:                        cg_blktot(cgp)[i]++;
                   1582:                }
                   1583:        }
                   1584:        fs->fs_fmod = 1;
                   1585: #if REV_ENDIAN_FS
                   1586:        if (rev_endian)
                   1587:                byte_swap_cgout(cgp,fs);
                   1588: #endif /* REV_ENDIAN_FS */
                   1589:        bdwrite(bp);
                   1590: }
                   1591: 
                   1592: #if DIAGNOSTIC
                   1593: /*
                   1594:  * Verify allocation of a block or fragment. Returns true if block or
                   1595:  * fragment is allocated, false if it is free.
                   1596:  */
                   1597: ffs_checkblk(ip, bno, size)
                   1598:        struct inode *ip;
                   1599:        ufs_daddr_t bno;
                   1600:        long size;
                   1601: {
                   1602:        struct fs *fs;
                   1603:        struct cg *cgp;
                   1604:        struct buf *bp;
                   1605:        int i, error, frags, free;
                   1606: #if REV_ENDIAN_FS
                   1607:        struct vnode *vp=ITOV(ip);
                   1608:        struct mount *mp=vp->v_mount;
                   1609:        int rev_endian=(mp->mnt_flag & MNT_REVEND);
                   1610: #endif /* REV_ENDIAN_FS */
                   1611: 
                   1612:        fs = ip->i_fs;
                   1613:        if ((u_int)size > fs->fs_bsize || fragoff(fs, size) != 0) {
                   1614:                printf("bsize = %d, size = %d, fs = %s\n",
                   1615:                    fs->fs_bsize, size, fs->fs_fsmnt);
                   1616:                panic("checkblk: bad size");
                   1617:        }
                   1618:        if ((u_int)bno >= fs->fs_size)
                   1619:                panic("checkblk: bad block %d", bno);
                   1620:        error = bread(ip->i_devvp, fsbtodb(fs, cgtod(fs, dtog(fs, bno))),
                   1621:                (int)fs->fs_cgsize, NOCRED, &bp);
                   1622:        if (error) {
                   1623:                brelse(bp);
                   1624:                return;
                   1625:        }
                   1626:        cgp = (struct cg *)bp->b_data;
                   1627: #if REV_ENDIAN_FS
                   1628:        if (rev_endian)
                   1629:                byte_swap_cgin(cgp,fs);
                   1630: #endif /* REV_ENDIAN_FS */
                   1631:        if (!cg_chkmagic(cgp)) {
                   1632: #if REV_ENDIAN_FS
                   1633:                if (rev_endian)
                   1634:                        byte_swap_cgout(cgp,fs);
                   1635: #endif /* REV_ENDIAN_FS */
                   1636:                brelse(bp);
                   1637:                return;
                   1638:        }
                   1639:        bno = dtogd(fs, bno);
                   1640:        if (size == fs->fs_bsize) {
                   1641:                free = ffs_isblock(fs, cg_blksfree(cgp), fragstoblks(fs, bno));
                   1642:        } else {
                   1643:                frags = numfrags(fs, size);
                   1644:                for (free = 0, i = 0; i < frags; i++)
                   1645:                        if (isset(cg_blksfree(cgp), bno + i))
                   1646:                                free++;
                   1647:                if (free != 0 && free != frags)
                   1648:                        panic("checkblk: partially free fragment");
                   1649:        }
                   1650: #if REV_ENDIAN_FS
                   1651:        if (rev_endian)
                   1652:                byte_swap_cgout(cgp,fs);
                   1653: #endif /* REV_ENDIAN_FS */
                   1654:        brelse(bp);
                   1655:        return (!free);
                   1656: }
                   1657: #endif /* DIAGNOSTIC */
                   1658: 
                   1659: /*
                   1660:  * Free an inode.
                   1661:  *
                   1662:  * The specified inode is placed back in the free map.
                   1663:  */
                   1664: int
                   1665: ffs_vfree(ap)
                   1666:        struct vop_vfree_args /* {
                   1667:                struct vnode *a_pvp;
                   1668:                ino_t a_ino;
                   1669:                int a_mode;
                   1670:        } */ *ap;
                   1671: {
                   1672:        register struct fs *fs;
                   1673:        register struct cg *cgp;
                   1674:        register struct inode *pip;
                   1675:        ino_t ino = ap->a_ino;
                   1676:        struct buf *bp;
                   1677:        int error, cg;
                   1678: #if REV_ENDIAN_FS
                   1679:        struct vnode *vp=ap->a_pvp;
                   1680:        struct mount *mp=vp->v_mount;
                   1681:        int rev_endian=(mp->mnt_flag & MNT_REVEND);
                   1682: #endif /* REV_ENDIAN_FS */
                   1683: 
                   1684:        pip = VTOI(ap->a_pvp);
                   1685:        fs = pip->i_fs;
                   1686:        if ((u_int)ino >= fs->fs_ipg * fs->fs_ncg)
                   1687:                panic("ifree: range: dev = 0x%x, ino = %d, fs = %s\n",
                   1688:                    pip->i_dev, ino, fs->fs_fsmnt);
                   1689:        cg = ino_to_cg(fs, ino);
                   1690:        error = bread(pip->i_devvp, fsbtodb(fs, cgtod(fs, cg)),
                   1691:                (int)fs->fs_cgsize, NOCRED, &bp);
                   1692:        if (error) {
                   1693:                brelse(bp);
                   1694:                return (0);
                   1695:        }
                   1696:        cgp = (struct cg *)bp->b_data;
                   1697: #if REV_ENDIAN_FS
                   1698:        if (rev_endian)
                   1699:                byte_swap_cgin(cgp,fs);
                   1700: #endif /* REV_ENDIAN_FS */
                   1701:        if (!cg_chkmagic(cgp)) {
                   1702: #if REV_ENDIAN_FS
                   1703:                if (rev_endian)
                   1704:                        byte_swap_cgout(cgp,fs);
                   1705: #endif /* REV_ENDIAN_FS */
                   1706:                brelse(bp);
                   1707:                return (0);
                   1708:        }
                   1709:        cgp->cg_time = time.tv_sec;
                   1710:        ino %= fs->fs_ipg;
                   1711:        if (isclr(cg_inosused(cgp), ino)) {
                   1712:                printf("dev = 0x%x, ino = %d, fs = %s\n",
                   1713:                    pip->i_dev, ino, fs->fs_fsmnt);
                   1714:                if (fs->fs_ronly == 0)
                   1715:                        panic("ifree: freeing free inode");
                   1716:        }
                   1717:        clrbit(cg_inosused(cgp), ino);
                   1718:        if (ino < cgp->cg_irotor)
                   1719:                cgp->cg_irotor = ino;
                   1720:        cgp->cg_cs.cs_nifree++;
                   1721:        fs->fs_cstotal.cs_nifree++;
                   1722:        fs->fs_cs(fs, cg).cs_nifree++;
                   1723:        if ((ap->a_mode & IFMT) == IFDIR) {
                   1724:                cgp->cg_cs.cs_ndir--;
                   1725:                fs->fs_cstotal.cs_ndir--;
                   1726:                fs->fs_cs(fs, cg).cs_ndir--;
                   1727:        }
                   1728:        fs->fs_fmod = 1;
                   1729: #if REV_ENDIAN_FS
                   1730:        if (rev_endian)
                   1731:                byte_swap_cgout(cgp,fs);
                   1732: #endif /* REV_ENDIAN_FS */
                   1733:        bdwrite(bp);
                   1734:        return (0);
                   1735: }
                   1736: 
                   1737: /*
                   1738:  * Find a block of the specified size in the specified cylinder group.
                   1739:  *
                   1740:  * It is a panic if a request is made to find a block if none are
                   1741:  * available.
                   1742:  */
                   1743: static ufs_daddr_t
                   1744: ffs_mapsearch(fs, cgp, bpref, allocsiz)
                   1745:        register struct fs *fs;
                   1746:        register struct cg *cgp;
                   1747:        ufs_daddr_t bpref;
                   1748:        int allocsiz;
                   1749: {
                   1750:        ufs_daddr_t bno;
                   1751:        int start, len, loc, i;
                   1752:        int blk, field, subfield, pos;
                   1753: 
                   1754:        /*
                   1755:         * find the fragment by searching through the free block
                   1756:         * map for an appropriate bit pattern
                   1757:         */
                   1758:        if (bpref)
                   1759:                start = dtogd(fs, bpref) / NBBY;
                   1760:        else
                   1761:                start = cgp->cg_frotor / NBBY;
                   1762:        len = howmany(fs->fs_fpg, NBBY) - start;
                   1763:        loc = scanc((u_int)len, (u_char *)&cg_blksfree(cgp)[start],
                   1764:                (u_char *)fragtbl[fs->fs_frag],
                   1765:                (u_char)(1 << (allocsiz - 1 + (fs->fs_frag % NBBY))));
                   1766:        if (loc == 0) {
                   1767:                len = start + 1;
                   1768:                start = 0;
                   1769:                loc = scanc((u_int)len, (u_char *)&cg_blksfree(cgp)[0],
                   1770:                        (u_char *)fragtbl[fs->fs_frag],
                   1771:                        (u_char)(1 << (allocsiz - 1 + (fs->fs_frag % NBBY))));
                   1772:                if (loc == 0) {
                   1773:                        printf("start = %d, len = %d, fs = %s\n",
                   1774:                            start, len, fs->fs_fsmnt);
                   1775:                        panic("ffs_alloccg: map corrupted");
                   1776:                        /* NOTREACHED */
                   1777:                }
                   1778:        }
                   1779:        bno = (start + len - loc) * NBBY;
                   1780:        cgp->cg_frotor = bno;
                   1781:        /*
                   1782:         * found the byte in the map
                   1783:         * sift through the bits to find the selected frag
                   1784:         */
                   1785:        for (i = bno + NBBY; bno < i; bno += fs->fs_frag) {
                   1786:                blk = blkmap(fs, cg_blksfree(cgp), bno);
                   1787:                blk <<= 1;
                   1788:                field = around[allocsiz];
                   1789:                subfield = inside[allocsiz];
                   1790:                for (pos = 0; pos <= fs->fs_frag - allocsiz; pos++) {
                   1791:                        if ((blk & field) == subfield)
                   1792:                                return (bno + pos);
                   1793:                        field <<= 1;
                   1794:                        subfield <<= 1;
                   1795:                }
                   1796:        }
                   1797:        printf("bno = %d, fs = %s\n", bno, fs->fs_fsmnt);
                   1798:        panic("ffs_alloccg: block not in map");
                   1799:        return (-1);
                   1800: }
                   1801: 
                   1802: /*
                   1803:  * Update the cluster map because of an allocation or free.
                   1804:  *
                   1805:  * Cnt == 1 means free; cnt == -1 means allocating.
                   1806:  */
                   1807: ffs_clusteracct(fs, cgp, blkno, cnt)
                   1808:        struct fs *fs;
                   1809:        struct cg *cgp;
                   1810:        ufs_daddr_t blkno;
                   1811:        int cnt;
                   1812: {
                   1813:        int32_t *sump;
                   1814:        int32_t *lp;
                   1815:        u_char *freemapp, *mapp;
                   1816:        int i, start, end, forw, back, map, bit;
                   1817: 
                   1818:        if (fs->fs_contigsumsize <= 0)
                   1819:                return;
                   1820:        freemapp = cg_clustersfree(cgp);
                   1821:        sump = cg_clustersum(cgp);
                   1822:        /*
                   1823:         * Allocate or clear the actual block.
                   1824:         */
                   1825:        if (cnt > 0)
                   1826:                setbit(freemapp, blkno);
                   1827:        else
                   1828:                clrbit(freemapp, blkno);
                   1829:        /*
                   1830:         * Find the size of the cluster going forward.
                   1831:         */
                   1832:        start = blkno + 1;
                   1833:        end = start + fs->fs_contigsumsize;
                   1834:        if (end >= cgp->cg_nclusterblks)
                   1835:                end = cgp->cg_nclusterblks;
                   1836:        mapp = &freemapp[start / NBBY];
                   1837:        map = *mapp++;
                   1838:        bit = 1 << (start % NBBY);
                   1839:        for (i = start; i < end; i++) {
                   1840:                if ((map & bit) == 0)
                   1841:                        break;
                   1842:                if ((i & (NBBY - 1)) != (NBBY - 1)) {
                   1843:                        bit <<= 1;
                   1844:                } else {
                   1845:                        map = *mapp++;
                   1846:                        bit = 1;
                   1847:                }
                   1848:        }
                   1849:        forw = i - start;
                   1850:        /*
                   1851:         * Find the size of the cluster going backward.
                   1852:         */
                   1853:        start = blkno - 1;
                   1854:        end = start - fs->fs_contigsumsize;
                   1855:        if (end < 0)
                   1856:                end = -1;
                   1857:        mapp = &freemapp[start / NBBY];
                   1858:        map = *mapp--;
                   1859:        bit = 1 << (start % NBBY);
                   1860:        for (i = start; i > end; i--) {
                   1861:                if ((map & bit) == 0)
                   1862:                        break;
                   1863:                if ((i & (NBBY - 1)) != 0) {
                   1864:                        bit >>= 1;
                   1865:                } else {
                   1866:                        map = *mapp--;
                   1867:                        bit = 1 << (NBBY - 1);
                   1868:                }
                   1869:        }
                   1870:        back = start - i;
                   1871:        /*
                   1872:         * Account for old cluster and the possibly new forward and
                   1873:         * back clusters.
                   1874:         */
                   1875:        i = back + forw + 1;
                   1876:        if (i > fs->fs_contigsumsize)
                   1877:                i = fs->fs_contigsumsize;
                   1878:        sump[i] += cnt;
                   1879:        if (back > 0)
                   1880:                sump[back] -= cnt;
                   1881:        if (forw > 0)
                   1882:                sump[forw] -= cnt;
                   1883:        /*
                   1884:         * Update cluster summary information.
                   1885:         */
                   1886:        lp = &sump[fs->fs_contigsumsize];
                   1887:        for (i = fs->fs_contigsumsize; i > 0; i--)
                   1888:                if (*lp-- > 0)
                   1889:                        break;
                   1890:        fs->fs_maxcluster[cgp->cg_cgx] = i;
                   1891: }
                   1892: 
                   1893: /*
                   1894:  * Fserr prints the name of a file system with an error diagnostic.
                   1895:  * 
                   1896:  * The form of the error message is:
                   1897:  *     fs: error message
                   1898:  */
                   1899: static void
                   1900: ffs_fserr(fs, uid, cp)
                   1901:        struct fs *fs;
                   1902:        u_int uid;
                   1903:        char *cp;
                   1904: {
                   1905: 
                   1906:        log(LOG_ERR, "uid %d on %s: %s\n", uid, fs->fs_fsmnt, cp);
                   1907: }

unix.superglobalmegacorp.com

This archive runs on limited infrastructure. Preserving old code on modern bandwidth. Automated agents are requested to crawl responsibly.