Annotation of GNUtools/cctools/as/hash.c, revision 1.1

1.1     ! root        1: /* hash.c - hash table lookup strings -
        !             2:    Copyright (C) 1987 Free Software Foundation, Inc.
        !             3: 
        !             4: This file is part of GAS, the GNU Assembler.
        !             5: 
        !             6: GAS is free software; you can redistribute it and/or modify
        !             7: it under the terms of the GNU General Public License as published by
        !             8: the Free Software Foundation; either version 1, or (at your option)
        !             9: any later version.
        !            10: 
        !            11: GAS is distributed in the hope that it will be useful,
        !            12: but WITHOUT ANY WARRANTY; without even the implied warranty of
        !            13: MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
        !            14: GNU General Public License for more details.
        !            15: 
        !            16: You should have received a copy of the GNU General Public License
        !            17: along with GAS; see the file COPYING.  If not, write to
        !            18: the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.  */
        !            19: 
        !            20: /*
        !            21:  * BUGS, GRIPES, APOLOGIA etc.
        !            22:  *
        !            23:  * A typical user doesn't need ALL this: I intend to make a library out
        !            24:  * of it one day - Dean Elsner.
        !            25:  * Also, I want to change the definition of a symbol to (address,length)
        !            26:  * so I can put arbitrary binary in the names stored. [see hsh.c for that]
        !            27:  *
        !            28:  * This slime is common coupled inside the module. Com-coupling (and other
        !            29:  * vandalism) was done to speed running time. The interfaces at the
        !            30:  * module's edges are adequately clean.
        !            31:  *
        !            32:  * There is no way to (a) run a test script through this heap and (b)
        !            33:  * compare results with previous scripts, to see if we have broken any
        !            34:  * code. Use GNU (f)utilities to do this. A few commands assist test.
        !            35:  * The testing is awkward: it tries to be both batch & interactive.
        !            36:  * For now, interactive rules!
        !            37:  */
        !            38: 
        !            39: /*
        !            40:  *  The idea is to implement a symbol table. A test jig is here.
        !            41:  *  Symbols are arbitrary strings; they can't contain '\0'.
        !            42:  *     [See hsh.c for a more general symbol flavour.]
        !            43:  *  Each symbol is associated with a char*, which can point to anything
        !            44:  *  you want, allowing an arbitrary property list for each symbol.
        !            45:  *
        !            46:  *  The basic operations are:
        !            47:  *
        !            48:  *    new                     creates symbol table, returns handle
        !            49:  *    find (symbol)           returns char*
        !            50:  *    insert (symbol,char*)   error if symbol already in table
        !            51:  *    delete (symbol)         returns char* if symbol was in table
        !            52:  *    apply                   so you can delete all symbols before die()
        !            53:  *    die                     destroy symbol table (free up memory)
        !            54:  *
        !            55:  *  Supplementary functions include:
        !            56:  *
        !            57:  *    say                     how big? what % full?
        !            58:  *    replace (symbol,newval) report previous value
        !            59:  *    jam (symbol,value)      assert symbol:=value
        !            60:  *
        !            61:  *  You, the caller, have control over errors: this just reports them.
        !            62:  *
        !            63:  *  This package requires malloc(), free().
        !            64:  *  Malloc(size) returns NULL or address of char[size].
        !            65:  *  Free(address) frees same.
        !            66:  */
        !            67: 
        !            68: /*
        !            69:  *  The code and its structures are re-enterent.
        !            70:  *  Before you do anything else, you must call hash_new() which will
        !            71:  *  return the address of a hash-table-control-block (or NULL if there
        !            72:  *  is not enough memory). You then use this address as a handle of the
        !            73:  *  symbol table by passing it to all the other hash_...() functions.
        !            74:  *  The only approved way to recover the memory used by the symbol table
        !            75:  *  is to call hash_die() with the handle of the symbol table.
        !            76:  *
        !            77:  *  Before you call hash_die() you normally delete anything pointed to
        !            78:  *  by individual symbols. After hash_die() you can't use that symbol
        !            79:  *  table again.
        !            80:  *
        !            81:  *  The char* you associate with a symbol may not be NULL (0) because
        !            82:  *  NULL is returned whenever a symbol is not in the table. Any other
        !            83:  *  value is OK, except DELETED, #defined below.
        !            84:  *
        !            85:  *  When you supply a symbol string for insertion, YOU MUST PRESERVE THE
        !            86:  *  STRING until that symbol is deleted from the table. The reason is that
        !            87:  *  only the address you supply, NOT the symbol string itself, is stored
        !            88:  *  in the symbol table.
        !            89:  *
        !            90:  *  You may delete and add symbols arbitrarily.
        !            91:  *  Any or all symbols may have the same 'value' (char *). In fact, these
        !            92:  *  routines don't do anything with your symbol values.
        !            93:  *
        !            94:  *  You have no right to know where the symbol:char* mapping is stored,
        !            95:  *  because it moves around in memory; also because we may change how it
        !            96:  *  works and we don't want to break your code do we? However the handle
        !            97:  *  (address of struct hash_control) is never changed in
        !            98:  *  the life of the symbol table.
        !            99:  *
        !           100:  *  What you CAN find out about a symbol table is:
        !           101:  *    how many slots are in the hash table?
        !           102:  *    how many slots are filled with symbols?
        !           103:  *    (total hashes,collisions) for (reads,writes) (*)
        !           104:  *  All of the above values vary in time.
        !           105:  *  (*) some of these numbers will not be meaningful if we change the
        !           106:  *  internals.
        !           107:  */
        !           108: 
        !           109: /*
        !           110:  *  I N T E R N A L
        !           111:  *
        !           112:  *  Hash table is an array of hash_entries; each entry is a pointer to a
        !           113:  *  a string and a user-supplied value 1 char* wide.
        !           114:  *
        !           115:  *  The array always has 2 ** n elements, n>0, n integer.
        !           116:  *  There is also a 'wall' entry after the array, which is always empty
        !           117:  *  and acts as a sentinel to stop running off the end of the array.
        !           118:  *  When the array gets too full, we create a new array twice as large
        !           119:  *  and re-hash the symbols into the new array, then forget the old array.
        !           120:  *  (Of course, we copy the values into the new array before we junk the
        !           121:  *  old array!)
        !           122:  *
        !           123:  */
        !           124: 
        !           125: #include <stdio.h>
        !           126: #include <stdlib.h>
        !           127: #include <ctype.h>
        !           128: #include "hash.h"
        !           129: #include "xmalloc.h"
        !           130: #include "messages.h"
        !           131: 
        !           132: #define TRUE           (1)
        !           133: #define FALSE          (0)
        !           134: #define min(a, b)      ((a) < (b) ? (a) : (b))
        !           135: 
        !           136: 
        !           137: #define DELETED     ((char *)1)        /* guarenteed invalid address */
        !           138: #define START_POWER    (11)    /* power of two: size of new hash table *//* JF was 6 */
        !           139: /* JF These next two aren't used any more. */
        !           140: /* #define START_SIZE    (64)  / * 2 ** START_POWER */
        !           141: /* #define START_FULL    (32)      / * number of entries before table expands */
        !           142: #define islive(ptr) (ptr->hash_string && ptr->hash_string!=DELETED)
        !           143:                                /* above TRUE if a symbol is in entry @ ptr */
        !           144: 
        !           145: #define STAT_SIZE      (0)      /* number of slots in hash table */
        !           146:                                /* the wall does not count here */
        !           147:                                /* we expect this is always a power of 2 */
        !           148: #define STAT_ACCESS    (1)     /* number of hash_ask()s */
        !           149: #define STAT__READ     (0)      /* reading */
        !           150: #define STAT__WRITE    (1)      /* writing */
        !           151: #define STAT_COLLIDE   (3)     /* number of collisions (total) */
        !           152:                                /* this may exceed STAT_ACCESS if we have */
        !           153:                                /* lots of collisions/access */
        !           154: #define STAT_USED      (5)     /* slots used right now */
        !           155: #define STATLENGTH     (6)     /* size of statistics block */
        !           156: #if STATLENGTH != HASH_STATLENGTH
        !           157: Panic! Please make #include "stat.h" agree with previous definitions!
        !           158: #endif
        !           159: 
        !           160: /* #define SUSPECT to do runtime checks */
        !           161: /* #define TEST to be a test jig for hash...() */
        !           162: 
        !           163: #ifdef TEST                    /* TEST: use smaller hash table */
        !           164: #undef  START_POWER
        !           165: #define START_POWER (3)
        !           166: #undef  START_SIZE
        !           167: #define START_SIZE  (8)
        !           168: #undef  START_FULL
        !           169: #define START_FULL  (4)
        !           170: static void hash_die(
        !           171:     struct hash_control *handle);
        !           172: static void hash_say(
        !           173:     struct hash_control *handle,
        !           174:     int buffer[/*bufsiz*/],
        !           175:     int bufsiz);
        !           176: static char *hash_delete(              /* previous value         */
        !           177:     struct hash_control *handle,
        !           178:     char *string);
        !           179: static char *hash_replace(             /* previous value         */
        !           180:     struct hash_control *handle,
        !           181:     char *string,
        !           182:     char *value);
        !           183: #endif /* TEST */
        !           184: 
        !           185: /*------------------ plan ---------------------------------- i = internal
        !           186: 
        !           187: struct hash_control * c;
        !           188: struct hash_entry   * e;                                                    i
        !           189: int                   b[z];     buffer for statistics
        !           190:                       z         size of b
        !           191: char                * s;        symbol string (address) [ key ]
        !           192: char                * v;        value string (address)  [datum]
        !           193: boolean               f;        TRUE if we found s in hash table            i
        !           194: char                * t;        error string; "" means OK
        !           195: int                   a;        access type [0...n)                         i
        !           196: 
        !           197: c=hash_new       ()             create new hash_control
        !           198: 
        !           199: hash_die         (c)            destroy hash_control (and hash table)
        !           200:                                 table should be empty.
        !           201:                                 doesn't check if table is empty.
        !           202:                                 c has no meaning after this.
        !           203: 
        !           204: hash_say         (c,b,z)        report statistics of hash_control.
        !           205:                                 also report number of available statistics.
        !           206: 
        !           207: v=hash_delete    (c,s)          delete symbol, return old value if any.
        !           208:     ask()                       NULL means no old value.
        !           209:     f
        !           210: 
        !           211: v=hash_replace   (c,s,v)        replace old value of s with v.
        !           212:     ask()                       NULL means no old value: no table change.
        !           213:     f
        !           214: 
        !           215: t=hash_insert    (c,s,v)        insert (s,v) in c.
        !           216:     ask()                       return error string.
        !           217:     f                           it is an error to insert if s is already
        !           218:                                 in table.
        !           219:                                 if any error, c is unchanged.
        !           220: 
        !           221: t=hash_jam       (c,s,v)        assert that new value of s will be v.       i
        !           222:     ask()                       it may decide to GROW the table.            i
        !           223:     f                                                                       i
        !           224:     grow()                                                                  i
        !           225: t=hash_grow      (c)            grow the hash table.                        i
        !           226:     jam()                       will invoke JAM.                            i
        !           227: 
        !           228: ?=hash_apply     (c,y)          apply y() to every symbol in c.
        !           229:     y                           evtries visited in 'unspecified' order.
        !           230: 
        !           231: v=hash_find      (c,s)          return value of s, or NULL if s not in c.
        !           232:     ask()
        !           233:     f
        !           234: 
        !           235: f,e=hash_ask()   (c,s,a)        return slot where s SHOULD live.            i
        !           236:     code()                      maintain collision stats in c.              i
        !           237: 
        !           238: .=hash_code      (c,s)          compute hash-code for s,                    i
        !           239:                                 from parameters of c.                       i
        !           240: 
        !           241: */
        !           242: 
        !           243: static char hash_found;                /* returned by hash_ask() to stop extra */
        !           244:                                /* testing. hash_ask() wants to return both */
        !           245:                                /* a slot and a status. This is the status. */
        !           246:                                /* TRUE: found symbol */
        !           247:                                /* FALSE: absent: empty or deleted slot */
        !           248:                                /* Also returned by hash_jam(). */
        !           249:                                /* TRUE: we replaced a value */
        !           250:                                /* FALSE: we inserted a value */
        !           251: 
        !           252: static struct hash_entry *hash_ask(
        !           253:     struct hash_control *handle,
        !           254:     char *string,
        !           255:     int access);
        !           256: static int hash_code(
        !           257:     struct hash_control *handle,
        !           258:     char *string);
        !           259: static char *hash_grow(
        !           260:     struct hash_control *handle);
        !           261: 
        !           262: /*
        !           263:  *             h a s h _ n e w ( )
        !           264:  *
        !           265:  */
        !           266: struct hash_control *
        !           267: hash_new(void)                 /* create a new hash table */
        !           268:                                /* return NULL if failed */
        !           269:                                /* return handle (address of struct hash) */
        !           270: {
        !           271:   register struct hash_control * retval;
        !           272:   register struct hash_entry *   room; /* points to hash table */
        !           273:   register struct hash_entry *   wall;
        !           274:   register struct hash_entry *   entry;
        !           275:   register int *                 ip;   /* scan stats block of struct hash_control */
        !           276:   register int *                 nd;   /* limit of stats block */
        !           277: 
        !           278:   if ((room = (struct hash_entry *) malloc( sizeof(struct hash_entry)*((1<<START_POWER) + 1) ) ))
        !           279:                                /* +1 for the wall entry */
        !           280:     {
        !           281:       if ((retval = (struct hash_control *) malloc(sizeof(struct hash_control)) ))
        !           282:        {
        !           283:          nd = retval->hash_stat + STATLENGTH;
        !           284:          for (ip=retval->hash_stat; ip<nd; ip++)
        !           285:            {
        !           286:              *ip = 0;
        !           287:            }
        !           288: 
        !           289:          retval -> hash_stat[STAT_SIZE]  = 1<<START_POWER;
        !           290:          retval -> hash_mask             = (1<<START_POWER) - 1;
        !           291:          retval -> hash_sizelog          = START_POWER;
        !           292:                                /* works for 1's compl ok */
        !           293:          retval -> hash_where            = room;
        !           294:          retval -> hash_wall             =
        !           295:            wall                          = room + (1<<START_POWER);
        !           296:          retval -> hash_full             = (1<<START_POWER)/2;
        !           297:          for (entry=room; entry<=wall; entry++)
        !           298:            {
        !           299:              entry->hash_string = NULL;
        !           300:            }
        !           301:        }
        !           302:     }
        !           303:   else
        !           304:     {
        !           305:       retval = NULL;           /* no room for table: fake a failure */
        !           306:     }
        !           307:   return(retval);              /* return NULL or set-up structs */
        !           308: }
        !           309: 
        !           310: #ifdef TEST
        !           311: /*
        !           312:  *           h a s h _ d i e ( )
        !           313:  *
        !           314:  * Table should be empty, but this is not checked.
        !           315:  * To empty the table, try hash_apply()ing a symbol deleter.
        !           316:  * Return to free memory both the hash table and it's control
        !           317:  * block.
        !           318:  * 'handle' has no meaning after this function.
        !           319:  * No errors are recoverable.
        !           320:  */
        !           321: static
        !           322: void
        !           323: hash_die(
        !           324: struct hash_control *handle)
        !           325: {
        !           326:   free((char *)handle->hash_where);
        !           327:   free((char *)handle);
        !           328: }
        !           329: 
        !           330: /*
        !           331:  *           h a s h _ s a y ( )
        !           332:  *
        !           333:  * Return the size of the statistics table, and as many statistics as
        !           334:  * we can until either (a) we have run out of statistics or (b) caller
        !           335:  * has run out of buffer.
        !           336:  * NOTE: hash_say treats all statistics alike.
        !           337:  * These numbers may change with time, due to insertions, deletions
        !           338:  * and expansions of the table.
        !           339:  * The first "statistic" returned is the length of hash_stat[].
        !           340:  * Then contents of hash_stat[] are read out (in ascending order)
        !           341:  * until your buffer or hash_stat[] is exausted.
        !           342:  */
        !           343: static
        !           344: void
        !           345: hash_say(
        !           346: struct hash_control *handle,
        !           347: int buffer[/*bufsiz*/],
        !           348: int bufsiz)
        !           349: {
        !           350:   register int * nd;                   /* limit of statistics block */
        !           351:   register int * ip;                   /* scan statistics */
        !           352: 
        !           353:   ip = handle -> hash_stat;
        !           354:   nd = ip + min(bufsiz-1,STATLENGTH);
        !           355:   if (bufsiz>0)                        /* trust nothing! bufsiz<=0 is dangerous */
        !           356:     {
        !           357:       *buffer++ = STATLENGTH;
        !           358:       for (; ip<nd; ip++,buffer++)
        !           359:        {
        !           360:          *buffer = *ip;
        !           361:        }
        !           362:     }
        !           363: }
        !           364: 
        !           365: /*
        !           366:  *           h a s h _ d e l e t e ( )
        !           367:  *
        !           368:  * Try to delete a symbol from the table.
        !           369:  * If it was there, return its value (and adjust STAT_USED).
        !           370:  * Otherwise, return NULL.
        !           371:  * Anyway, the symbol is not present after this function.
        !           372:  *
        !           373:  */
        !           374: static
        !           375: char *                         /* NULL if string not in table, else */
        !           376: hash_delete(                   /* returns value of deleted symbol */
        !           377: struct hash_control *handle,
        !           378: char *string)
        !           379: {
        !           380:   register char *                   retval; /* NULL if string not in table */
        !           381:   register struct hash_entry *      entry; /* NULL or entry of this symbol */
        !           382: 
        !           383:   entry = hash_ask(handle,string,STAT__WRITE);
        !           384:   if (hash_found)
        !           385:     {
        !           386:          retval = entry -> hash_value;
        !           387:          entry -> hash_string = DELETED; /* mark as deleted */
        !           388:          handle -> hash_stat[STAT_USED] -= 1; /* slots-in-use count */
        !           389: #ifdef SUSPECT
        !           390:          if (handle->hash_stat[STAT_USED]<0)
        !           391:            {
        !           392: #ifdef NeXT
        !           393:              as_fatal("hash_delete");
        !           394: #else
        !           395:              error("hash_delete");
        !           396: #endif
        !           397:            }
        !           398: #endif /* def SUSPECT */
        !           399:     }
        !           400:   else
        !           401:     {
        !           402:       retval = NULL;
        !           403:     }
        !           404:   return(retval);
        !           405: }
        !           406: 
        !           407: /*
        !           408:  *                   h a s h _ r e p l a c e ( )
        !           409:  *
        !           410:  * Try to replace the old value of a symbol with a new value.
        !           411:  * Normally return the old value.
        !           412:  * Return NULL and don't change the table if the symbol is not already
        !           413:  * in the table.
        !           414:  */
        !           415: static
        !           416: char *
        !           417: hash_replace(
        !           418: struct hash_control *handle,
        !           419: char *string,
        !           420: char *value)
        !           421: {
        !           422:   register struct hash_entry *      entry;
        !           423:   register char *                   retval;
        !           424: 
        !           425:   entry = hash_ask(handle,string,STAT__WRITE);
        !           426:   if (hash_found)
        !           427:     {
        !           428:       retval = entry -> hash_value;
        !           429:       entry -> hash_value = value;
        !           430:     }
        !           431:   else
        !           432:     {
        !           433:       retval = NULL;
        !           434:     }
        !           435:   ;
        !           436:   return (retval);
        !           437: }
        !           438: #endif /* TEST */
        !           439: 
        !           440: /*
        !           441:  *                   h a s h _ i n s e r t ( )
        !           442:  *
        !           443:  * Insert a (symbol-string, value) into the hash table.
        !           444:  * Return an error string, "" means OK.
        !           445:  * It is an 'error' to insert an existing symbol.
        !           446:  */
        !           447: char *                         /* return error string */
        !           448: hash_insert(
        !           449: struct hash_control *handle,
        !           450: char *string,
        !           451: char *value)
        !           452: {
        !           453:   register struct hash_entry * entry;
        !           454:   register char *              retval;
        !           455: 
        !           456:   retval = "";
        !           457:   if (handle->hash_stat[STAT_USED] > handle->hash_full)
        !           458:     {
        !           459:       retval = hash_grow(handle);
        !           460:     }
        !           461:   if ( ! * retval)
        !           462:     {
        !           463:       entry = hash_ask(handle,string,STAT__WRITE);
        !           464:       if (hash_found)
        !           465:        {
        !           466:          retval = "exists";
        !           467:        }
        !           468:       else
        !           469:        {
        !           470:          entry -> hash_value  = value;
        !           471:          entry -> hash_string = string;
        !           472:          handle-> hash_stat[STAT_USED]  += 1;
        !           473:        }
        !           474:     }
        !           475:   return(retval);
        !           476: }
        !           477: 
        !           478: /*
        !           479:  *               h a s h _ j a m ( )
        !           480:  *
        !           481:  * Regardless of what was in the symbol table before, after hash_jam()
        !           482:  * the named symbol has the given value. The symbol is either inserted or
        !           483:  * (its value is) relpaced.
        !           484:  * An error message string is returned, "" means OK.
        !           485:  *
        !           486:  * WARNING: this may decide to grow the hashed symbol table.
        !           487:  * To do this, we call hash_grow(), WHICH WILL recursively CALL US.
        !           488:  *
        !           489:  * We report status internally: hash_found is TRUE if we replaced, but
        !           490:  * false if we inserted.
        !           491:  */
        !           492: char *
        !           493: hash_jam(
        !           494: struct hash_control *handle,
        !           495: char *string,
        !           496: char *value)
        !           497: {
        !           498:   register char *                   retval;
        !           499:   register struct hash_entry *      entry;
        !           500: 
        !           501:   retval = "";
        !           502:   if (handle->hash_stat[STAT_USED] > handle->hash_full)
        !           503:     {
        !           504:       retval = hash_grow(handle);
        !           505:     }
        !           506:   if (! * retval)
        !           507:     {
        !           508:       entry = hash_ask(handle,string,STAT__WRITE);
        !           509:       if ( ! hash_found)
        !           510:        {
        !           511:          entry -> hash_string = string;
        !           512:          handle->hash_stat[STAT_USED] += 1;
        !           513:        }
        !           514:       entry -> hash_value = value;
        !           515:     }
        !           516:   return(retval);
        !           517: }
        !           518: 
        !           519: /*
        !           520:  *               h a s h _ g r o w ( )
        !           521:  *
        !           522:  * Grow a new (bigger) hash table from the old one.
        !           523:  * We choose to double the hash table's size.
        !           524:  * Return a human-scrutible error string: "" if OK.
        !           525:  * Warning! This uses hash_jam(), which had better not recurse
        !           526:  * back here! Hash_jam() conditionally calls us, but we ALWAYS
        !           527:  * call hash_jam()!
        !           528:  * Internal.
        !           529:  */
        !           530: static
        !           531: char *
        !           532: hash_grow(             /* make a hash table grow */
        !           533: struct hash_control *handle)
        !           534: {
        !           535:   register struct hash_entry *      newwall;
        !           536:   register struct hash_entry *      newwhere;
        !           537:   struct hash_entry *      newtrack;
        !           538:   register struct hash_entry *      oldtrack;
        !           539:   register struct hash_entry *      oldwhere;
        !           540:   register struct hash_entry *      oldwall;
        !           541:   register int                      temp;
        !           542:   int                      newsize;
        !           543:   char *                   string;
        !           544:   char *                   retval;
        !           545: #ifdef SUSPECT
        !           546:   int                      oldused;
        !           547: #endif
        !           548: 
        !           549:   /*
        !           550:    * capture info about old hash table
        !           551:    */
        !           552:   oldwhere = handle -> hash_where;
        !           553:   oldwall  = handle -> hash_wall;
        !           554: #ifdef SUSPECT
        !           555:   oldused  = handle -> hash_stat[STAT_USED];
        !           556: #endif
        !           557:   /*
        !           558:    * attempt to get enough room for a hash table twice as big
        !           559:    */
        !           560:   temp = handle->hash_stat[STAT_SIZE];
        !           561:   if ((newwhere = (struct hash_entry *) xmalloc((long)((temp+temp+1)*sizeof(struct hash_entry)))))
        !           562:                                /* +1 for wall slot */
        !           563:     {
        !           564:       retval = "";             /* assume success until proven otherwise */
        !           565:       /*
        !           566:        * have enough room: now we do all the work.
        !           567:        * double the size of everything in handle,
        !           568:        * note: hash_mask frob works for 1's & for 2's complement machines
        !           569:        */
        !           570:       handle->hash_mask              = handle->hash_mask + handle->hash_mask + 1;
        !           571:       handle->hash_stat[STAT_SIZE] <<= 1;
        !           572:       newsize                        = handle->hash_stat[STAT_SIZE];
        !           573:       handle->hash_where             = newwhere;
        !           574:       handle->hash_full            <<= 1;
        !           575:       handle->hash_sizelog         += 1;
        !           576:       handle->hash_stat[STAT_USED]   = 0;
        !           577:       handle->hash_wall              =
        !           578:       newwall                        = newwhere + newsize;
        !           579:       /*
        !           580:        * set all those pesky new slots to vacant.
        !           581:        */
        !           582:       for (newtrack=newwhere; newtrack < newwall; newtrack++)
        !           583:        {
        !           584:          newtrack -> hash_string = NULL;
        !           585:        }
        !           586:       /*
        !           587:        * we will do a scan of the old table, the hard way, using the
        !           588:        * new control block to re-insert the data into new hash table.
        !           589:        */
        !           590:       handle -> hash_stat[STAT_USED] = 0;      /* inserts will bump it up to correct */
        !           591:       for (oldtrack=oldwhere; oldtrack < oldwall; oldtrack++)
        !           592:        {
        !           593:          if ( (string=oldtrack->hash_string) && string!=DELETED )
        !           594:            {
        !           595:              if ( * (retval = hash_jam(handle,string,oldtrack->hash_value) ) )
        !           596:                {
        !           597:                  break;
        !           598:                }
        !           599:            }
        !           600:        }
        !           601: #ifdef SUSPECT
        !           602:       if ( !*retval && handle->hash_stat[STAT_USED] != oldused)
        !           603:        {
        !           604:          retval = "hash_used";
        !           605:        }
        !           606: #endif
        !           607:       if (!*retval)
        !           608:        {
        !           609:          /*
        !           610:           * we have a completely faked up control block.
        !           611:           * return the old hash table.
        !           612:           */
        !           613:          free((char *)oldwhere);
        !           614:          /*
        !           615:           * Here with success. retval is already "".
        !           616:           */
        !           617:        }
        !           618:     }
        !           619:   else
        !           620:     {
        !           621:       retval = "no room";
        !           622:     }
        !           623:   return(retval);
        !           624: }
        !           625: 
        !           626: /*
        !           627:  *          h a s h _ a p p l y ( )
        !           628:  *
        !           629:  * Use this to scan each entry in symbol table.
        !           630:  * For each symbol, this calls (applys) a nominated function supplying the
        !           631:  * symbol's value (and the symbol's name).
        !           632:  * The idea is you use this to destroy whatever is associted with
        !           633:  * any values in the table BEFORE you destroy the table with hash_die.
        !           634:  * Of course, you can use it for other jobs; whenever you need to
        !           635:  * visit all extant symbols in the table.
        !           636:  *
        !           637:  * We choose to have a call-you-back idea for two reasons:
        !           638:  *  asthetic: it is a neater idea to use apply than an explicit loop
        !           639:  *  sensible: if we ever had to grow the symbol table (due to insertions)
        !           640:  *            then we would lose our place in the table when we re-hashed
        !           641:  *            symbols into the new table in a different order.
        !           642:  *
        !           643:  * The order symbols are visited depends entirely on the hashing function.
        !           644:  * Whenever you insert a (symbol, value) you risk expanding the table. If
        !           645:  * you do expand the table, then the hashing function WILL change, so you
        !           646:  * MIGHT get a different order of symbols visited. In other words, if you
        !           647:  * want the same order of visiting symbols as the last time you used
        !           648:  * hash_apply() then you better not have done any hash_insert()s or
        !           649:  * hash_jam()s since the last time you used hash_apply().
        !           650:  *
        !           651:  * In future we may use the value returned by your nominated function.
        !           652:  * One idea is to abort the scan if, after applying the function to a
        !           653:  * certain node, the function returns a certain code.
        !           654:  * To be safe, please make your functions of type char *. If you always
        !           655:  * return NULL, then the scan will complete, visiting every symbol in
        !           656:  * the table exactly once. ALL OTHER RETURNED VALUES have no meaning yet!
        !           657:  * Caveat Actor!
        !           658:  *
        !           659:  * The function you supply should be of the form:
        !           660:  *      char * myfunct(string,value)
        !           661:  *              char * string;        |* the symbol's name *|
        !           662:  *              char * value;         |* the symbol's value *|
        !           663:  *      {
        !           664:  *        |* ... *|
        !           665:  *        return(NULL);
        !           666:  *      }
        !           667:  *
        !           668:  * The returned value of hash_apply() is (char*)NULL. In future it may return
        !           669:  * other values. NULL means "completed scan OK". Other values have no meaning
        !           670:  * yet. (The function has no graceful failures.)
        !           671:  */
        !           672: char *
        !           673: hash_apply(
        !           674: struct hash_control *handle,
        !           675: char *(*function)(char *hash_string, char *hash_value))
        !           676: {
        !           677:   register struct hash_entry *      entry;
        !           678:   register struct hash_entry *      wall;
        !           679: 
        !           680:   wall = handle->hash_wall;
        !           681:   for (entry = handle->hash_where; entry < wall; entry++)
        !           682:     {
        !           683:       if (islive(entry))       /* silly code: tests entry->string twice! */
        !           684:        {
        !           685:          (*function)(entry->hash_string,entry->hash_value);
        !           686:        }
        !           687:     }
        !           688:   return (NULL);
        !           689: }
        !           690: 
        !           691: /*
        !           692:  *          h a s h _ f i n d ( )
        !           693:  *
        !           694:  * Given symbol string, find value (if any).
        !           695:  * Return found value or NULL.
        !           696:  */
        !           697: char *
        !           698: hash_find(
        !           699: struct hash_control *handle,
        !           700: char *string)
        !           701: {
        !           702:   register struct hash_entry *      entry;
        !           703:   register char *                   retval;
        !           704: 
        !           705:   entry = hash_ask(handle,string,STAT__READ);
        !           706:   if (hash_found)
        !           707:     {
        !           708:       retval = entry->hash_value;
        !           709:     }
        !           710:   else
        !           711:     {
        !           712:       retval = NULL;
        !           713:     }
        !           714:   return(retval);
        !           715: }
        !           716: 
        !           717: /*
        !           718:  *          h a s h _ a s k ( )
        !           719:  *
        !           720:  * Searches for given symbol string.
        !           721:  * Return the slot where it OUGHT to live. It may be there.
        !           722:  * Return hash_found: TRUE only if symbol is in that slot.
        !           723:  * Access argument is to help keep statistics in control block.
        !           724:  * Internal.
        !           725:  */
        !           726: static
        !           727: struct hash_entry *    /* string slot, may be empty or deleted */
        !           728: hash_ask(
        !           729: struct hash_control * handle,
        !           730: char *                string,
        !           731: int                   access) /* access type */
        !           732: {
        !           733:   register char        *string1;       /* JF avoid strcmp calls */
        !           734:   register char *                   s;
        !           735:   register int                      c;
        !           736:   register struct hash_entry *      slot;
        !           737:   register int                      collision; /* count collisions */
        !           738: 
        !           739:   slot = handle->hash_where + hash_code(handle,string); /* start looking here */
        !           740:   handle->hash_stat[STAT_ACCESS+access] += 1;
        !           741:   collision = 0;
        !           742:   hash_found = FALSE;
        !           743:   while ( (s = slot->hash_string) && s!=DELETED )
        !           744:     {
        !           745:        for(string1=string;;) {
        !           746:                if(!(c= *s++)) {
        !           747:                        if(!*string1)
        !           748:                                hash_found = TRUE;
        !           749:                        break;
        !           750:                }
        !           751:                if(*string1++!=c)
        !           752:                        break;
        !           753:        }
        !           754:        if(hash_found)
        !           755:                break;
        !           756:       collision++;
        !           757:       slot++;
        !           758:     }
        !           759:   /*
        !           760:    * slot:                                                      return:
        !           761:    *       in use:     we found string                           slot
        !           762:    *       at empty:
        !           763:    *                   at wall:        we fell off: wrap round   ????
        !           764:    *                   in table:       dig here                  slot
        !           765:    *       at DELETED: dig here                                  slot
        !           766:    */
        !           767:   if (slot==handle->hash_wall)
        !           768:     {
        !           769:       slot = handle->hash_where; /* now look again */
        !           770:       while( (s = slot->hash_string) && s!=DELETED )
        !           771:        {
        !           772:          for(string1=string;*s;string1++,s++) {
        !           773:            if(*string1!=*s)
        !           774:                break;
        !           775:          }
        !           776:          if(*s==*string1) {
        !           777:              hash_found = TRUE;
        !           778:              break;
        !           779:            }
        !           780:          collision++;
        !           781:          slot++;
        !           782:        }
        !           783:       /*
        !           784:        * slot:                                                   return:
        !           785:        *       in use: we found it                                slot
        !           786:        *       empty:  wall:         ERROR IMPOSSIBLE             !!!!
        !           787:        *               in table:     dig here                     slot
        !           788:        *       DELETED:dig here                                   slot
        !           789:        */
        !           790:     }
        !           791: /*   fprintf(stderr,"hash_ask(%s)->%d(%d)\n",string,hash_code(handle,string),collision); */
        !           792:   handle -> hash_stat[STAT_COLLIDE+access] += collision;
        !           793:   return(slot);                        /* also return hash_found */
        !           794: }
        !           795: 
        !           796: /*
        !           797:  *           h a s h _ c o d e
        !           798:  *
        !           799:  * Does hashing of symbol string to hash number.
        !           800:  * Internal.
        !           801:  */
        !           802: static
        !           803: int
        !           804: hash_code(
        !           805: struct hash_control *handle,
        !           806: char *string)
        !           807: {
        !           808:   register long int                 h;      /* hash code built here */
        !           809:   register long int                 c;      /* each character lands here */
        !           810:   register int                    n;      /* Amount to shift h by */
        !           811: 
        !           812:   n = (handle->hash_sizelog - 3);
        !           813:   h = 0;
        !           814:   while((c = *string++))
        !           815:     {
        !           816:       h += c;
        !           817:       h = (h<<3) + (h>>n) + c;
        !           818:     }
        !           819:   return (h & handle->hash_mask);
        !           820: }
        !           821: 
        !           822: /*
        !           823:  * Here is a test program to exercise above.
        !           824:  */
        !           825: #ifdef TEST
        !           826: 
        !           827: #define TABLES (6)             /* number of hash tables to maintain */
        !           828:                                /* (at once) in any testing */
        !           829: #define STATBUFSIZE (12)       /* we can have 12 statistics */
        !           830: 
        !           831: int statbuf[STATBUFSIZE];      /* display statistics here */
        !           832: char answer[100];              /* human farts here */
        !           833: struct hash_control *
        !           834:        hashtable[TABLES];      /* we test many hash tables at once */
        !           835: struct hash_control * h;       /* points to curent hash_control */
        !           836: struct hash_control ** pp;
        !           837: struct hash_control *  p;
        !           838: char *  name;
        !           839: char *  value;
        !           840: int     size;
        !           841: int     used;
        !           842: char    command;
        !           843: int     number;                        /* number 0:TABLES-1 of current hashed */
        !           844:                                /* symbol table */
        !           845: static char *what(
        !           846:     char * description);
        !           847: static char *destroy(
        !           848:     char * string,
        !           849:     char * value);
        !           850: static char *applicatee(
        !           851:     char * string,
        !           852:     char * value);
        !           853: static void whattable(
        !           854:     void);
        !           855: 
        !           856: main()
        !           857: {
        !           858:   int *  ip;
        !           859:   char * error;
        !           860:   char * thing;
        !           861: 
        !           862:   number = 0;
        !           863:   h = NULL;
        !           864:   printf("type h <RETURN> for help\n");
        !           865:   for(;;)
        !           866:     {
        !           867:       printf("hash_test command: ");
        !           868:       gets(answer);
        !           869:       command = answer[0];
        !           870:       if (isupper(command)) command = tolower(command);        /* ecch! */
        !           871:       switch (command)
        !           872:        {
        !           873:        case '#':
        !           874:          printf("old hash table #=%d.\n",number);
        !           875:          whattable();
        !           876:          break;
        !           877:        case '?':
        !           878:          for (pp=hashtable; pp<hashtable+TABLES; pp++)
        !           879:            {
        !           880:              printf("address of hash table #%d control block is %xx\n"
        !           881:                     ,pp-hashtable,*pp);
        !           882:            }
        !           883:          break;
        !           884:        case 'a':
        !           885:          hash_apply(h,applicatee);
        !           886:          break;
        !           887:        case 'd':
        !           888:          hash_apply(h,destroy);
        !           889:          hash_die(h);
        !           890:          break;
        !           891:        case 'f':
        !           892:          thing = hash_find(h,name=what("symbol"));
        !           893:          printf("value of \"%s\" is \"%s\"\n",name,thing?thing:"NOT-PRESENT");
        !           894:          break;
        !           895:        case 'h':
        !           896:          printf("# show old, select new default hash table number\n");
        !           897:          printf("? display all hashtable control block addresses\n");
        !           898:          printf("a apply a simple display-er to each symbol in table\n");
        !           899:          printf("d die: destroy hashtable\n");
        !           900:          printf("f find value of nominated symbol\n");
        !           901:          printf("h this help\n");
        !           902:          printf("i insert value into symbol\n");
        !           903:          printf("j jam value into symbol\n");
        !           904:          printf("n new hashtable\n");
        !           905:          printf("r replace a value with another\n");
        !           906:          printf("s say what %% of table is used\n");
        !           907:          printf("q exit this program\n");
        !           908:          printf("x delete a symbol from table, report its value\n");
        !           909:          break;
        !           910:        case 'i':
        !           911:          error = hash_insert(h,name=what("symbol"),value=what("value"));
        !           912:          if(*error)
        !           913:            {
        !           914:              printf("symbol=\"%s\"  value=\"%s\"  error=%s\n",name,value,error);
        !           915:            }
        !           916:          break;
        !           917:        case 'j':
        !           918:          error = hash_jam(h,name=what("symbol"),value=what("value"));
        !           919:          if (*error)
        !           920:            {
        !           921:              printf("symbol=\"%s\"  value=\"%s\"  error=%s\n",name,value,error);
        !           922:            }
        !           923:          break;
        !           924:        case 'n':
        !           925:          h = hashtable[number] = hash_new();
        !           926:          break;
        !           927:        case 'q':
        !           928:          exit(0);
        !           929:        case 'r':
        !           930:          thing = hash_replace(h,name=what("symbol"),value=what("value"));
        !           931:          printf("old value was \"%s\"\n",thing?thing:"{}");
        !           932:          break;
        !           933:        case 's':
        !           934:          hash_say(h,statbuf,STATBUFSIZE);
        !           935:          for (ip=statbuf; ip<statbuf+STATBUFSIZE; ip++)
        !           936:            {
        !           937:              printf("%d ",*ip);
        !           938:            }
        !           939:          printf("\n");
        !           940:          break;
        !           941:        case 'x':
        !           942:          thing = hash_delete(h,name=what("symbol"));
        !           943:          printf("old value was \"%s\"\n",thing?thing:"{}");
        !           944:          break;
        !           945:        default:
        !           946:          printf("I can't understand command \"%c\"\n",command);
        !           947:          break;
        !           948:        }
        !           949:     }
        !           950: }
        !           951: 
        !           952: static
        !           953: char *
        !           954: what(
        !           955: char * description)
        !           956: {
        !           957:   char * retval;
        !           958: 
        !           959:   printf("   %s : ",description);
        !           960:   gets(answer);
        !           961:   /* will one day clean up answer here */
        !           962:   retval = malloc(strlen(answer)+1);
        !           963:   if (!retval)
        !           964:     {
        !           965: #ifdef NeXT
        !           966:       as_fatal("room");
        !           967: #else
        !           968:       error("room");
        !           969: #endif
        !           970:     }
        !           971:   (void)strcpy(retval,answer);
        !           972:   return(retval);
        !           973: }
        !           974: 
        !           975: static
        !           976: char *
        !           977: destroy(
        !           978: char * string,
        !           979: char * value)
        !           980: {
        !           981:   free(string);
        !           982:   free(value);
        !           983:   return(NULL);
        !           984: }
        !           985: 
        !           986: static
        !           987: char *
        !           988: applicatee(
        !           989: char * string,
        !           990: char * value)
        !           991: {
        !           992:   printf("%.20s-%.20s\n",string,value);
        !           993:   return(NULL);
        !           994: }
        !           995: 
        !           996: static
        !           997: void
        !           998: whattable(                     /* determine number: what hash table to use */
        !           999: void)                          /* also determine h: points to hash_control */
        !          1000: {
        !          1001: 
        !          1002:   for (;;)
        !          1003:     {
        !          1004:       printf("   what hash table (%d:%d) ?  ",0,TABLES-1);
        !          1005:       gets(answer);
        !          1006:       sscanf(answer,"%d",&number);
        !          1007:       if (number>=0 && number<TABLES)
        !          1008:        {
        !          1009:          h = hashtable[number];
        !          1010:          if (!h)
        !          1011:            {
        !          1012:              printf("warning: current hash-table-#%d. has no hash-control\n",number);
        !          1013:            }
        !          1014:          return;
        !          1015:        }
        !          1016:       else
        !          1017:        {
        !          1018:          printf("invalid hash table number: %d\n",number);
        !          1019:        }
        !          1020:     }
        !          1021: }
        !          1022: 
        !          1023: void *
        !          1024: xmalloc(
        !          1025: long n)
        !          1026: {
        !          1027:     void *retval;
        !          1028: 
        !          1029:        if(!(retval = malloc((unsigned)n))){
        !          1030:            printf("virtual memory exceeded\n");
        !          1031:            exit(1);
        !          1032:        }
        !          1033:        return(retval);
        !          1034: }
        !          1035: 
        !          1036: void *
        !          1037: xrealloc(
        !          1038: void *ptr,
        !          1039: long n)
        !          1040: {
        !          1041:     if((ptr = realloc(ptr, (unsigned)n)) == 0){
        !          1042:        printf("virtual memory exceeded\n");
        !          1043:        exit(1);
        !          1044:     }
        !          1045:     return(ptr);
        !          1046: }
        !          1047: 
        !          1048: void
        !          1049: as_fatal(
        !          1050: const char *format,
        !          1051: ...)
        !          1052: {
        !          1053:     va_list ap;
        !          1054: 
        !          1055:        va_start(ap, format);
        !          1056:        fprintf (stderr, "FATAL:");
        !          1057:        vfprintf(stderr, format, ap);
        !          1058:        fprintf(stderr, "\n");
        !          1059:        va_end(ap);
        !          1060:        exit(1);
        !          1061: }
        !          1062: #endif /* #ifdef TEST */

unix.superglobalmegacorp.com

This archive runs on limited infrastructure. Preserving old code on modern bandwidth. Automated agents are requested to crawl responsibly.