Diff for /gforth/hash.fs between versions 1.1 and 1.30

version 1.1, 1994/07/21 10:52:43 version 1.30, 2002/12/07 18:07:19
Line 1 Line 1
 \ Hashed dictionaries                                  15jul94py  \ Hashed dictionaries                                  15jul94py
   
 $80 Value Hashlen  \ Copyright (C) 1995,1998,2000 Free Software Foundation, Inc.
   
   \ This file is part of Gforth.
   
   \ Gforth is free software; you can redistribute it and/or
   \ modify it under the terms of the GNU General Public License
   \ as published by the Free Software Foundation; either version 2
   \ of the License, or (at your option) any later version.
   
   \ This program is distributed in the hope that it will be useful,
   \ but WITHOUT ANY WARRANTY; without even the implied warranty of
   \ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   \ GNU General Public License for more details.
   
   \ You should have received a copy of the GNU General Public License
   \ along with this program; if not, write to the Free Software
   \ Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA.
   
   [IFUNDEF] erase
   : erase ( addr len -- ) 0 fill ;
   [THEN]
   
   [IFUNDEF] allocate
   : reserve-mem here swap allot ;
   \ move to a kernel/memory.fs
   [ELSE]
   : reserve-mem allocate throw ;
   [THEN]
   
   [IFUNDEF] hashbits
   11 Value hashbits
   [THEN]
   1 hashbits lshift Value Hashlen
   
   \ compute hash key                                     15jul94py
   
   has? ec [IF] [IFUNDEF] hash
   : hash ( addr len -- key )
     over c@ swap 1- IF swap char+ c@ + ELSE nip THEN
     [ Hashlen 1- ] literal and ;
   [THEN] [THEN]
   
   [IFUNDEF] hash
   : hash ( addr len -- key )
       hashbits (hashkey1) ;
   [THEN]
   
 Variable insRule        insRule on  Variable insRule        insRule on
   Variable revealed
   
 \ Memory handling                                      15jul94py  \ Memory handling                                      10oct94py
   
 Variable HashPointer  AVariable HashPointer
   Variable HashIndex     \ Number of wordlists
   Variable HashPop       \ Number of words
   0 AValue HashTable
   
 : hash-alloc ( addr -- addr )  dup @ 0= IF  \ forward declarations
   Hashlen cells allocate throw over !  0 AValue hashsearch-map
   dup @ Hashlen cells erase THEN ;  Defer hash-alloc ( addr -- addr )
   
 \ DelFix and NewFix is from bigFORTH                   15jul94py  \ DelFix and NewFix are from bigFORTH                  15jul94py
   
 : DelFix ( addr root -- ) dup @ 2 pick ! ! ;  : DelFix ( addr root -- ) dup @ 2 pick ! ! ;
 : NewFix  ( root len # -- addr )  : NewFix  ( root len # -- addr )
   BEGIN  2 pick @ ?dup  0= WHILE  2dup * allocate throw    BEGIN  2 pick @ ?dup  0= WHILE  2dup * reserve-mem
          over 0 ?DO  dup 4 pick DelFix 2 pick +  LOOP  drop           over 0 ?DO  dup 4 pick DelFix 2 pick +  LOOP  drop
   REPEAT  >r drop r@ @ rot ! r@ swap erase r> ;    REPEAT  >r drop r@ @ rot ! r@ swap erase r> ;
   
 \ compute hash key                                     15jul94py  : bucket ( addr len wordlist -- bucket-addr )
       \ @var{bucket-addr} is the address of a cell that points to the first
       \ element in the list of the bucket for the string @var{addr len}
       wordlist-extend @ -rot hash xor ( bucket# )
       cells HashTable + ;
   
 : hash ( addr len -- key )  (hashkey)  : hash-find ( addr len wordlist -- nfa / false )
 \  tuck bounds  ?DO  I c@ toupper +  LOOP      >r 2dup r> bucket @ (hashlfind) ;
   Hashlen 1- and ;  
   
 : hash-find ( addr len wordlist -- nfa / false ) $C + @ >r  
   2dup hash cells r> + @ (hashfind) ;  
 \  BEGIN  dup  WHILE  
 \         2@ >r >r dup r@ cell+ c@ $1F and =  
 \         IF  2dup r@ cell+ char+ capscomp 0=  
 \            IF  2drop r> rdrop  EXIT  THEN  THEN  
 \        rdrop r>  
 \  REPEAT nip nip ;  
   
 \ hash vocabularies                                    16jul94py  \ hash vocabularies                                    16jul94py
   
 : lastlink! ( addr link -- )  : lastlink! ( addr link -- )
   BEGIN  dup @ dup  WHILE  nip  REPEAT  drop ! ;    BEGIN  dup @ dup  WHILE  nip  REPEAT  drop ! ;
   
 : (reveal ( addr voc -- )  $C + dup @ 0< IF  2drop EXIT  THEN  : (reveal ( nfa wid -- )
   hash-alloc @ over cell+ count $1F and Hash cells + >r      over name>string rot bucket >r
   HashPointer 8 $400 NewFix      HashPointer 2 Cells $400 NewFix
   tuck cell+ ! r> insRule @      tuck cell+ ! r> insRule @
   IF  dup @ 2 pick ! !  ELSE  lastlink!  THEN ;      IF
           dup @ 2 pick ! !
 : hash-reveal ( -- )  (reveal) last?  IF      ELSE
   current @ (reveal  THEN ;          lastlink!
       THEN
 Create hashsearch  ' hash-find A,  ' hash-reveal A,  ' drop A,      revealed on 1 HashPop +! 0 hash-alloc drop ;
   
 : (initvoc ( addr -- )  cell+ dup @ 0< IF  drop EXIT  THEN  : hash-reveal ( nfa wid -- )
   insRule @ >r  insRule off  hash-alloc      2dup (reveal) (reveal ;
   3 cells - hashsearch over cell+ ! dup  
   BEGIN  @ dup  WHILE  2dup swap (reveal  REPEAT  : inithash ( wid -- )
   2drop  r> insRule ! ;      wordlist-extend
       insRule @ >r  insRule off  1 hash-alloc over ! 3 cells -
 ' (initvoc IS 'initvoc      dup wordlist-id
       BEGIN  @ dup  WHILE  2dup swap (reveal  REPEAT
 : addall  ( -- )  voclink      2drop  r> insRule ! ;
   BEGIN  @ dup @  WHILE  dup (initvoc  REPEAT  drop ;  
   : addall  ( -- )
       HashPop off voclink
       BEGIN  @ dup WHILE
              dup 0 wordlist-link -
              dup wordlist-map @ reveal-method @ ['] hash-reveal = 
              IF  inithash ELSE drop THEN
       REPEAT  drop ;
   
   : clearhash  ( -- )
       HashTable Hashlen cells bounds
       DO  I @
           BEGIN  dup  WHILE
               dup @ swap HashPointer DelFix
           REPEAT
           I !
           cell +LOOP
       HashIndex off 
       voclink
       BEGIN ( wordlist-link-addr )
           @ dup
       WHILE ( wordlist-link )
           dup 0 wordlist-link - ( wordlist-link wid ) 
           dup wordlist-map @ hashsearch-map = 
           IF ( wordlist-link wid )
               0 swap wordlist-extend !
           ELSE
               drop
           THEN
       REPEAT
       drop ;
   
   : rehashall  ( wid -- ) 
     drop revealed @ 
     IF    clearhash addall revealed off 
     THEN ;
   
   : (rehash)   ( wid -- )
     dup wordlist-extend @ 0=
     IF   inithash
     ELSE rehashall THEN ;
   
   : hashdouble ( -- )
       HashTable >r clearhash
       1 hashbits 1+ dup  to hashbits  lshift  to hashlen
       r> free >r  0 to HashTable
       addall r> throw ;
   
   const Create (hashsearch-map)
   ' hash-find A, ' hash-reveal A, ' (rehash) A, ' (rehash) A,
   (hashsearch-map) to hashsearch-map
   
   \ hash allocate and vocabulary initialization          10oct94py
   
   \ Implementation of the deferred word hash-alloc ( n+ -- n ).
   \ On first use (HashTable is 0) it reserves and zeroes Hashlen cells.
   \ It returns the previous value of HashIndex and advances HashIndex by n+.
   \ Without ALLOCATE: aborts once HashIndex has reached Hashlen.
   \ With ALLOCATE: calls hashdouble once HashIndex has reached Hashlen
   \ or HashPop has reached twice hashlen.
   :noname ( n+ -- n )
     HashTable 0= 
     IF  Hashlen cells reserve-mem TO HashTable
         HashTable Hashlen cells erase THEN
     \ leave the old index as the result, then bump the index by n+
     HashIndex @ swap HashIndex +!
     \ flag: index has run past the table size
     HashIndex @ Hashlen >=
     [ [IFUNDEF] allocate ]
     ABORT" no more space in hashtable"
     [ [ELSE] ]
     HashPop @ hashlen 2* >= or
     IF  hashdouble  THEN 
     [ [THEN] ] ; is hash-alloc
   
 \ Hash-Find                                            01jan93py  \ Hash-Find                                            01jan93py
   has? cross 0= 
   [IF]
   : make-hash
     hashsearch-map forth-wordlist wordlist-map !
     addall ;
     make-hash \ Baumsuche ist installiert.
   [ELSE]
     hashsearch-map forth-wordlist wordlist-map !
   [THEN]
   
   \ for ec version display that vocabulary goes hashed
   
   : hash-cold  ( -- )
   [ has? ec [IF] ] ." Hashing..." [ [THEN] ]
     HashPointer off  0 TO HashTable  HashIndex off
     addall
   \  voclink
   \  BEGIN  @ dup WHILE
   \         dup 0 wordlist-link - initvoc
   \  REPEAT  drop 
   [ has? ec [IF] ] ." Done" cr [ [THEN] ] ;
   
 addall          \ Baum aufbauen  ' hash-cold INIT8 chained
 \ Baumsuche ist installiert.  
   
 : .words  ( -- )  : .words  ( -- )
   base @ >r hex context @ 3 cells +  HashLen 0    base @ >r hex HashTable  Hashlen 0
   DO  cr  i 2 .r ." : " dup @ i cells +    DO  cr  i 2 .r ." : " dup i cells +
       BEGIN  @ dup  WHILE        BEGIN  @ dup  WHILE
              dup cell+ @ .name  REPEAT  drop               dup cell+ @ name>string type space  REPEAT  drop
   LOOP  drop r> base ! ;    LOOP  drop r> base ! ;
   
   \ \ this stuff is for evaluating the hash function
   \ : square dup * ;
   
   \ : countwl  ( -- sum sumsq )
   \     \ gives the number of words in the current wordlist
   \     \ and the sum of squares for the sublist lengths
   \     0 0
   \     hashtable Hashlen cells bounds DO
   \        0 i BEGIN
   \            @ dup WHILE
   \            swap 1+ swap
   \        REPEAT
   \        drop
   \        swap over square +
   \        >r + r>
   \        1 cells
   \    +LOOP ;
   
   \ : chisq ( -- n )
   \     \ n should have about the same size as Hashlen
   \     countwl Hashlen 2 pick */ swap - ;

Removed from v.1.1  
changed lines
  Added in v.1.30


FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>