--- gforth/prims2x.fs 2001/01/23 10:05:36 1.72 +++ gforth/prims2x.fs 2001/03/18 10:33:25 1.91 @@ -40,6 +40,17 @@ \ add the store optimization for doubles \ regarding problem 1 above: It would be better (for over) to implement \ the alternative +\ store optimization for combined instructions. +\ eliminate stack-cast (no longer used) + +\ Design Uglyness: + +\ - global state (values, variables) in connection with combined instructions. + +\ - index computation is different for instruction-stream and the +\ stacks; there are two mechanisms for dealing with that +\ (stack-in-index-xt and a test for stack==instruction-stream); there +\ should be only one. warnings off @@ -49,6 +60,7 @@ warnings off \ different directory with the wordlibraries) include ./search.fs include ./extend.fs +include ./stuff.fs [THEN] [IFUNDEF] environment? @@ -89,6 +101,13 @@ skipsynclines on loop drop ; +: insert-wordlist { c-addr u wordlist xt -- } + \ adds name "addr u" to wordlist using defining word xt + \ xt may cause additional stack effects + get-current >r wordlist set-current + c-addr u nextname xt execute + r> set-current ; + : start ( -- addr ) cookedinput @ ; @@ -119,13 +138,10 @@ skipsynclines on variable output \ xt ( -- ) of output word for simple primitives variable output-combined \ xt ( -- ) of output word for combined primitives -: printprim ( -- ) - output @ execute ; - struct% cell% field stack-number \ the number of this stack cell% 2* field stack-pointer \ stackpointer name - cell% 2* field stack-typename \ name for default type of stack items + cell% field stack-type \ name for default type of stack items cell% 2* field stack-cast \ cast string for assignments to stack elements cell% field stack-in-index-xt \ ( in-size item -- in-index ) end-struct stack% @@ -155,22 +171,15 @@ create stacks max-stacks cells allot \ a : inst-in-index ( in-size item -- in-index ) nip dup item-offset @ swap item-type @ type-size @ + 1- ; -: make-stack ( addr-ptr u1 addr-stack u2 addr-cast 
u3 "stack-name" -- ) +: make-stack ( addr-ptr u1 type addr-cast u2 "stack-name" -- ) create stack% %allot >r r@ stacks next-stack-number @ th ! next-stack-number @ r@ stack-number ! 1 next-stack-number +! save-mem r@ stack-cast 2! - save-mem r@ stack-typename 2! + r@ stack-type ! save-mem r@ stack-pointer 2! ['] stack-in-index r> stack-in-index-xt ! ; -s" sp" save-mem s" Cell" save-mem s" (Cell)" make-stack data-stack -s" fp" save-mem s" Float" save-mem s" " make-stack fp-stack -s" rp" save-mem s" Cell" save-mem s" (Cell)" make-stack return-stack -s" IP" save-mem s" Cell" save-mem s" error don't use # on results" make-stack inst-stream -' inst-in-index inst-stream stack-in-index-xt ! -\ !! initialize stack-in and stack-out - \ stack items : init-item ( addr u addr1 -- ) @@ -185,6 +194,11 @@ s" IP" save-mem s" Cell" save-mem s" er i xt execute item% %size +loop ; +\ types + +: print-type-prefix ( type -- ) + body> >head name>string type ; + \ various variables for storing stuff of one primitive struct% @@ -195,6 +209,8 @@ struct% cell% 2* field prim-c-code cell% 2* field prim-forth-code cell% 2* field prim-stack-string + cell% field prim-num \ ordinal number + cell% field prim-items-wordlist \ unique items item% max-effect * field prim-effect-in item% max-effect * field prim-effect-out cell% field prim-effect-in-end @@ -208,15 +224,26 @@ end-struct prim% s" " p prim-doc 2! s" " p prim-forth-code 2! s" " p prim-wordset 2! 
p ; -0 value prim +0 value prim \ in combined prims either combined or a part +0 value combined \ in combined prims the combined prim +variable in-part \ true if processing a part + in-part off + +1000 constant max-combined +create combined-prims max-combined cells allot +variable num-combined + +table constant combinations + \ the keys are the sequences of pointers to primitives + +create current-depth max-stacks cells allot +create max-depth max-stacks cells allot +create min-depth max-stacks cells allot wordlist constant primitives : create-prim ( prim -- ) - get-current >r - primitives set-current - dup prim-name 2@ nextname constant - r> set-current ; + dup prim-name 2@ primitives ['] constant insert-wordlist ; : stack-in ( stack -- addr ) \ address of number of stack items in effect in @@ -234,11 +261,6 @@ variable name-line 2variable last-name-filename Variable function-number 0 function-number ! -\ for several reasons stack items of a word are stored in a wordlist -\ since neither forget nor marker are implemented yet, we make a new -\ wordlist for every word and store it in the variable items -variable items - \ a few more set ops : bit-equivalent ( w1 w2 -- w3 ) @@ -247,10 +269,9 @@ variable items : complement ( set1 -- set2 ) empty ['] bit-equivalent binary-set-operation ; -\ types +\ stack access stuff -: stack-access ( n stack -- ) - \ print a stack access at index n of stack +: normal-stack-access ( n stack -- ) stack-pointer 2@ type dup if @@ -259,25 +280,55 @@ variable items drop ." TOS" endif ; +\ forward declaration for inst-stream (breaks cycle in definitions) +defer inst-stream-f ( -- stack ) + +: part-stack-access { n stack -- } + \ print _<stack><x>, x=inst-stream? n : maxdepth-currentdepth-n-1 + ."
_" stack stack-pointer 2@ type + stack stack-number @ { stack# } + current-depth stack# th @ n + { access-depth } + stack inst-stream-f = if + access-depth + else + combined prim-stacks-in stack# th @ + assert( dup max-depth stack# th @ = ) + access-depth - 1- + endif + 0 .r ; + +: stack-access ( n stack -- ) + \ print a stack access at index n of stack + in-part @ if + part-stack-access + else + normal-stack-access + endif ; + : item-in-index { item -- n } \ n is the index of item (in the in-effect) item item-stack @ dup >r stack-in @ ( in-size r:stack ) item r> stack-in-index-xt @ execute ; +: item-stack-type-name ( item -- addr u ) + item-stack @ stack-type @ type-c-name 2@ ; + : fetch-single ( item -- ) \ fetch a single stack item from its stack >r r@ item-name 2@ type - ." = (" - r@ item-type @ type-c-name 2@ type ." ) " + ." = vm_" r@ item-stack-type-name type + ." 2" r@ item-type @ print-type-prefix ." (" r@ item-in-index r@ item-stack @ stack-access - ." ;" cr + ." );" cr rdrop ; : fetch-double ( item -- ) \ fetch a double stack item from its stack >r - ." FETCH_DCELL(" + ." vm_two" + r@ item-stack-type-name type ." 2" + r@ item-type @ print-type-prefix ." (" r@ item-name 2@ type ." , " r@ item-in-index r@ item-stack @ 2dup ." (Cell)" stack-access ." , " -1 under+ ." (Cell)" stack-access @@ -287,8 +338,10 @@ variable items : same-as-in? ( item -- f ) \ f is true iff the offset and stack of item is the same as on input >r - r@ item-name 2@ items @ search-wordlist 0= - abort" bug" + r@ item-first @ if + rdrop false exit + endif + r@ item-name 2@ prim prim-items-wordlist @ search-wordlist 0= abort" bug" execute @ dup r@ = if \ item first appeared in output @@ -305,9 +358,10 @@ variable items : really-store-single ( item -- ) >r - r@ item-out-index r@ item-stack @ stack-access ." = " - r@ item-stack @ stack-cast 2@ type - r@ item-name 2@ type ." ;" + r@ item-out-index r@ item-stack @ stack-access ." = vm_" + r@ item-type @ print-type-prefix ." 
2" r@ item-stack-type-name type ." (" r@ item-name 2@ type ." );" rdrop ; : store-single ( item -- ) @@ -327,7 +381,10 @@ variable items : store-double ( item -- ) \ !! store optimization is not performed, because it is not yet needed >r - ." STORE_DCELL(" r@ item-name 2@ type ." , " + ." vm_" + r@ item-type @ print-type-prefix ." 2two" + r@ item-stack-type-name type ." (" + r@ item-name 2@ type ." , " r@ item-out-index r@ item-stack @ 2dup stack-access ." , " -1 under+ stack-access ." );" cr @@ -375,7 +432,7 @@ does> ( item -- ) { item typ } typ item item-type ! typ type-stack @ item item-stack !default - item item-name 2@ items @ search-wordlist 0= if \ new name + item item-name 2@ prim prim-items-wordlist @ search-wordlist 0= if item item-name 2@ nextname item declare item item-first on \ typ type-c-name 2@ type space type ." ;" cr @@ -395,7 +452,7 @@ does> ( item -- ) endif -1 s+loop \ we did not find a type, abort - true abort" unknown prefix" ; + false s" unknown prefix" ?print-error ; : declaration ( item -- ) dup item-name 2@ execute-prefix ; @@ -404,7 +461,7 @@ does> ( item -- ) ['] declaration map-items ; : declarations ( -- ) - wordlist dup items ! set-current + wordlist dup prim prim-items-wordlist ! set-current prim prim-effect-in prim prim-effect-in-end @ declaration-list prim prim-effect-out prim prim-effect-out-end @ declaration-list ; @@ -426,6 +483,19 @@ does> ( item -- ) stack item item-stack ! item declaration ; +\ types pointed to by stacks for use in combined prims +\ !! output-c-combined shouldn't use these names! +s" Cell" single 0 create-type w +s" Float" single 0 create-type r + +s" sp" save-mem w s" (Cell)" make-stack data-stack +s" fp" save-mem r s" " make-stack fp-stack +s" rp" save-mem w s" (Cell)" make-stack return-stack +s" IP" save-mem w s" error don't use # on results" make-stack inst-stream +' inst-in-index inst-stream stack-in-index-xt ! +' inst-stream <is> inst-stream-f +\ !!
initialize stack-in and stack-out + \ offset computation \ the leftmost (i.e. deepest) item has offset 0 \ the rightmost item has the highest offset @@ -450,7 +520,13 @@ does> ( item -- ) inst-stream clear-stack prim prim-effect-in prim prim-effect-in-end @ ['] compute-offset-in map-items prim prim-effect-out prim prim-effect-out-end @ ['] compute-offset-out map-items - inst-stream stack-out @ 0<> abort" # can only be on the input side" ; + inst-stream stack-out @ 0= s" # can only be on the input side" ?print-error ; + +: process-simple ( -- ) + prim prim { W^ key } key cell + combinations ['] constant insert-wordlist + declarations compute-offsets + output @ execute ; : flush-a-tos { stack -- } stack stack-out @ 0<> stack stack-in @ 0= and @@ -509,41 +585,62 @@ does> ( item -- ) : stores ( -- ) prim prim-effect-out prim prim-effect-out-end @ ['] store map-items ; +: print-debug-arg { item -- } + ." fputs(" quote space item item-name 2@ type ." =" quote ." , vm_out); " + ." printarg_" item item-type @ print-type-prefix + ." (" item item-name 2@ type ." );" cr ; + +: print-debug-args ( -- ) + ." #ifdef VM_DEBUG" cr + ." if (vm_debug) {" cr + prim prim-effect-in prim prim-effect-in-end @ ['] print-debug-arg map-items +\ ." fputc('\n', vm_out);" cr + ." }" cr + ." #endif" cr ; + +: print-debug-result { item -- } + item item-first @ if + item print-debug-arg + endif ; + +: print-debug-results ( -- ) + cr + ." #ifdef VM_DEBUG" cr + ." if (vm_debug) {" cr + ." fputs(" quote ." -- " quote ." , vm_out); " + prim prim-effect-out prim prim-effect-out-end @ ['] print-debug-result map-items + ." fputc('\n', vm_out);" cr + ." }" cr + ." #endif" cr ; + +: output-super-end ( -- ) + prim prim-c-code 2@ s" SET_IP" search if + ." SUPER_END;" cr + endif + 2drop ; + : output-c-tail ( -- ) \ the final part of the generated C code + output-super-end + print-debug-results ." NEXT_P1;" cr stores fill-tos - ." NEXT_P2;" cr ; + ." 
NEXT_P2;" ; -: type-c ( c-addr u -- ) - \ like TYPE, but replaces "TAIL;" with tail code +: type-c-code ( c-addr u xt -- ) + \ like TYPE, but replaces "TAIL;" with tail code produced by xt + { xt } begin ( c-addr1 u1 ) 2dup s" TAIL;" search while ( c-addr1 u1 c-addr3 u3 ) 2dup 2>r drop nip over - type - output-c-tail + xt execute 2r> 5 /string \ !! resync #line missing repeat 2drop type ; -: print-type-prefix ( type -- ) - body> >head .name ; - -: print-debug-arg { item -- } - ." fputs(" quote space item item-name 2@ type ." =" quote ." , vm_out); " - ." printarg_" item item-type @ print-type-prefix - ." (" item item-name 2@ type ." );" cr ; - -: print-debug-args ( -- ) - ." #ifdef VM_DEBUG" cr - ." if (vm_debug) {" cr - prim prim-effect-in prim prim-effect-in-end @ ['] print-debug-arg map-items - ." fputc('\n', vm_out);" cr - ." }" cr - ." #endif" cr ; - : print-entry ( -- ) ." I_" prim prim-c-name 2@ type ." :" ; @@ -561,7 +658,7 @@ does> ( item -- ) stack-pointer-updates ." {" cr ." #line " c-line @ . quote c-filename 2@ type quote cr - prim prim-c-code 2@ type-c + prim prim-c-code 2@ ['] output-c-tail type-c-code ." }" cr output-c-tail ." }" cr @@ -585,7 +682,21 @@ does> ( item -- ) ." fputs(" quote prim prim-name 2@ type quote ." , vm_out);" cr disasm-args ." ip += " inst-stream stack-in @ 1+ 0 .r ." ;" cr - ." } else " ; + ." goto _endif_;" cr + ." }" cr ; + +: output-profile ( -- ) + \ generate code for postprocessing the VM block profile stuff + ." if (VM_IS_INST(*ip, " function-number @ 0 .r ." )) {" cr + ." add_inst(b, " quote prim prim-name 2@ type quote ." );" cr + ." ip += " inst-stream stack-in @ 1+ 0 .r ." ;" cr + prim prim-c-code 2@ s" SET_IP" search nip nip + prim prim-c-code 2@ s" SUPER_END" search nip nip or if + ." return;" cr + else + ." goto _endif_;" cr + endif + ." 
}" cr ; : gen-arg-parm { item -- } item item-stack @ inst-stream = if @@ -684,14 +795,12 @@ does> ( item -- ) [IFDEF] documentation : register-doc ( -- ) - get-current documentation set-current - prim prim-name 2@ nextname create + prim prim-name 2@ documentation ['] create insert-wordlist prim prim-name 2@ 2, prim prim-stack-string 2@ condition-stack-effect 2, prim prim-wordset 2@ 2, prim prim-c-name 2@ condition-pronounciation 2, - prim prim-doc 2@ 2, - set-current ; + prim prim-doc 2@ 2, ; [THEN] @@ -761,15 +870,8 @@ does> ( item -- ) \ spTOS = (Cell)_x_sp0; \ NEXT_P2; -1000 constant max-combined -create combined-prims max-combined cells allot -variable num-combined - -create current-depth max-stacks cells allot -create max-depth max-stacks cells allot -create min-depth max-stacks cells allot - : init-combined ( -- ) + prim to combined 0 num-combined ! current-depth max-stacks cells erase max-depth max-stacks cells erase @@ -820,7 +922,7 @@ create min-depth max-stacks cells al i 0 <# #s stack stack-pointer 2@ holds [char] _ hold #> save-mem item item-name 2! stack item item-stack ! - 0 item item-type ! + stack stack-type @ item item-type ! i item item-offset ! item item-first on item% %size effect-endp +! @@ -834,6 +936,10 @@ create min-depth max-stacks cells al loop ; : process-combined ( -- ) + combined combined-prims num-combined @ cells + combinations ['] constant insert-wordlist + combined-prims num-combined @ 1- th ( last-part ) + @ prim-c-code 2@ prim prim-c-code 2! \ used by output-super-end prim compute-effects prim init-effects output-combined perform ; @@ -842,8 +948,8 @@ create min-depth max-stacks cells al : print-item { n stack -- } \ print nth stack item name - ." _" stack stack-typename 2@ type space - stack stack-pointer 2@ type n 0 .r ; + stack stack-type @ type-c-name 2@ type space + ." 
_" stack stack-pointer 2@ type n 0 .r ; : print-declarations-combined ( -- ) max-stacks 0 ?do @@ -851,20 +957,91 @@ create min-depth max-stacks cells al i stacks j th @ print-item ." ;" cr loop loop ; - + +: part-fetches ( -- ) + fetches ; + +: part-output-c-tail ( -- ) + print-debug-results + stores ; + +: output-combined-tail ( -- ) + part-output-c-tail + prim >r combined to prim + in-part @ >r in-part off + output-c-tail + r> in-part ! r> to prim ; + +: output-part ( p -- ) + to prim + ." /* " prim prim-name 2@ type ." ( " prim prim-stack-string 2@ type ." ) */" cr + ." NAME(" quote prim prim-name 2@ type quote ." )" cr \ debugging + ." {" cr + print-declarations + part-fetches + print-debug-args + prim add-depths \ !! right place? + ." {" cr + ." #line " c-line @ . quote c-filename 2@ type quote cr + prim prim-c-code 2@ ['] output-combined-tail type-c-code + ." }" cr + part-output-c-tail + ." }" cr ; + +: output-parts ( -- ) + prim >r in-part on + current-depth max-stacks cells erase + num-combined @ 0 +do + combined-prims i th @ output-part + loop + in-part off + r> to prim ; + : output-c-combined ( -- ) print-entry cr - \ debugging messages just in constituents + \ debugging messages just in parts ." {" cr ." DEF_CA" cr print-declarations-combined ." NEXT_P0;" cr flush-tos fetches - ; + \ print-debug-args + stack-pointer-updates + output-parts + output-c-tail + ." }" cr + cr ; : output-forth-combined ( -- ) - ; +; + + +\ peephole optimization rules + +\ in order for this to work as intended, shorter combinations for each +\ length must be present, and the longer combinations must follow +\ shorter ones (this restriction may go away in the future). + +: output-peephole ( -- ) + combined-prims num-combined @ 1- cells combinations search-wordlist + s" the prefix for this combination must be defined earlier" ?print-error + ." {" + execute prim-num @ 5 .r ." ," + combined-prims num-combined @ 1- th @ prim-num @ 5 .r ." ," + combined prim-num @ 5 .r ." 
}, /* " + combined prim-c-name 2@ type ." */" + cr ; + +: output-forth-peephole ( -- ) + combined-prims num-combined @ 1- cells combinations search-wordlist + s" the prefix for this combination must be defined earlier" ?print-error + execute prim-num @ 5 .r + combined-prims num-combined @ 1- th @ prim-num @ 5 .r + combined prim-num @ 5 .r ." prim, \ " + combined prim-c-name 2@ type + cr ; + \ the parser @@ -899,11 +1076,11 @@ print-token ! endif 0. r> 6 chars + 20 >number drop >r drop line ! r> ( c-addr ) dup c@ bl = if - char+ dup c@ [char] " <> abort" sync line syntax" + char+ dup c@ [char] " <> 0= s" sync line syntax" ?print-error char+ dup 100 [char] " scan drop swap 2dup - save-mem filename 2! char+ endif - dup c@ nl-char <> abort" sync line syntax" + dup c@ nl-char <> 0= s" sync line syntax" ?print-error skipsynclines @ if dup char+ rawinput ! rawinput @ c@ cookedinput @ c! @@ -949,7 +1126,7 @@ bl 1+ maxchar .. char " singleton eof-char over add-member complement charclass noquote nl-char singleton charclass nl eof-char singleton charclass eof - +nl-char singleton eof-char over add-member charclass nleof (( letter (( letter || digit )) ** )) <- c-ident ( -- ) @@ -995,7 +1172,7 @@ Variable c-flag (( (( eval-comment || forth-comment || c-comment || else-comment || if-comment )) ?? nonl ** )) <- comment-body -(( ` \ comment-body nl )) <- comment ( -- ) +(( ` \ comment-body nleof )) <- comment ( -- ) (( {{ start }} stack-ident {{ end 2 pick init-item item% %size + }} white ** )) ** <- stack-items @@ -1009,24 +1186,25 @@ Variable c-flag ` ( white ** {{ start }} stack-effect {{ end prim prim-stack-string 2! }} ` ) white ** (( {{ start }} forth-ident {{ end prim prim-wordset 2! }} white ** (( {{ start }} c-ident {{ end prim prim-c-name 2! }} )) ?? - )) ?? nl - (( ` " ` " {{ start }} (( noquote ++ ` " )) ++ {{ end 1- prim prim-doc 2! }} ` " white ** nl )) ?? - {{ skipsynclines off line @ c-line ! filename 2@ c-filename 2! 
start }} (( nocolonnl nonl ** nl white ** )) ** {{ end prim prim-c-code 2! skipsynclines on }} - (( ` : white ** nl - {{ start }} (( nonl ++ nl white ** )) ++ {{ end prim prim-forth-code 2! }} - )) ?? {{ declarations compute-offsets printprim 1 function-number +! }} - (( nl || eof )) + )) ?? nleof + (( ` " ` " {{ start }} (( noquote ++ ` " )) ++ {{ end 1- prim prim-doc 2! }} ` " white ** nleof )) ?? + {{ skipsynclines off line @ c-line ! filename 2@ c-filename 2! start }} (( nocolonnl nonl ** nleof white ** )) ** {{ end prim prim-c-code 2! skipsynclines on }} + (( ` : white ** nleof + {{ start }} (( nonl ++ nleof white ** )) ++ {{ end prim prim-forth-code 2! }} + )) ?? {{ process-simple }} + nleof )) <- simple-primitive ( -- ) (( {{ init-combined }} - ` = (( white ++ {{ start }} forth-ident {{ end add-prim }} )) ++ - (( nl || eof )) {{ process-combined }} + ` = white ** (( {{ start }} forth-ident {{ end add-prim }} white ** )) ++ + nleof {{ process-combined }} )) <- combined-primitive -(( {{ make-prim to prim +(( {{ make-prim to prim 0 to combined line @ name-line ! filename 2@ name-filename 2! + function-number @ prim prim-num ! start }} forth-ident {{ end 2dup prim prim-name 2! prim prim-c-name 2! }} white ++ - (( simple-primitive || combined-primitive )) + (( simple-primitive || combined-primitive )) {{ 1 function-number +! }} )) <- primitive ( -- ) (( (( comment || primitive || nl white ** )) ** eof ))