version 1.7, 2000/09/23 15:47:08
|
version 1.39, 2008/08/09 13:24:25
|
Line 1
|
Line 1
|
/* This file defines a number of threading schemes. |
/* This file defines a number of threading schemes. |
|
|
Copyright (C) 1995, 1996,1997,1999 Free Software Foundation, Inc. |
Copyright (C) 1995, 1996,1997,1999,2003,2004,2005,2007 Free Software Foundation, Inc. |
|
|
This file is part of Gforth. |
This file is part of Gforth. |
|
|
Gforth is free software; you can redistribute it and/or |
Gforth is free software; you can redistribute it and/or |
modify it under the terms of the GNU General Public License |
modify it under the terms of the GNU General Public License |
as published by the Free Software Foundation; either version 2 |
as published by the Free Software Foundation, either version 3 |
of the License, or (at your option) any later version. |
of the License, or (at your option) any later version. |
|
|
This program is distributed in the hope that it will be useful, |
This program is distributed in the hope that it will be useful, |
Line 15
|
Line 15
|
GNU General Public License for more details. |
GNU General Public License for more details. |
|
|
You should have received a copy of the GNU General Public License |
You should have received a copy of the GNU General Public License |
along with this program; if not, write to the Free Software |
along with this program; if not, see http://www.gnu.org/licenses/. |
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA. |
|
|
|
|
|
This files defines macros for threading. Many sets of macros are |
This files defines macros for threading. Many sets of macros are |
Line 91
|
Line 90
|
|
|
*/ |
*/ |
|
|
/* CFA_NEXT: if NEXT uses cfa, you have to #define CFA_NEXT, to get |
#if !defined(GCC_PR15242_WORKAROUND) |
* cfa declared in engine. |
#if __GNUC__ == 3 |
*/ |
/* various gcc-3.x version have problems (including PR15242) that are |
|
solved with this workaround */ |
#ifdef DOUBLY_INDIRECT |
#define GCC_PR15242_WORKAROUND 1 |
# define CFA_NEXT |
#else |
# define NEXT_P0 ({cfa=*ip;}) |
/* other gcc versions are better off without the workaround for |
# define IP (ip) |
primitives that are not relocatable */ |
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
#define GCC_PR15242_WORKAROUND 0 |
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA Label ca; |
|
# define NEXT_P1 ({ip++; ca=**cfa;}) |
|
# define NEXT_P2 ({goto *ca;}) |
|
# define EXEC(XT) ({DEF_CA cfa=(XT); ca=**cfa; goto *ca;}) |
|
# define NEXT1_P1 ({ca = **cfa;}) |
|
# define NEXT1_P2 ({goto *ca;}) |
|
|
|
#else /* !defined(DOUBLY_INDIRECT) */ |
|
|
|
#if defined(DIRECT_THREADED) |
|
|
|
/* note that the "cfa dead" versions only work if GETCFA exists and works */ |
|
|
|
#if THREADING_SCHEME==1 |
|
#warning direct threading scheme 1: autoinc, long latency, cfa live |
|
# define CFA_NEXT |
|
# define NEXT_P0 ({cfa=*ip++;}) |
|
# define IP (ip-1) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 |
|
# define NEXT_P2 ({goto *cfa;}) |
|
# define EXEC(XT) ({cfa=(XT); goto *cfa;}) |
|
#endif |
|
|
|
#if THREADING_SCHEME==2 |
|
#warning direct threading scheme 2: autoinc, long latency, cfa dead |
|
#ifndef GETCFA |
|
#error GETCFA must be defined for cfa dead threading |
|
#endif |
#endif |
# define NEXT_P0 (ip++) |
|
# define IP (ip-1) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (*(ip-1)) |
|
# define INC_IP(const_inc) ({ ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 |
|
# define NEXT_P2 ({goto **(ip-1);}) |
|
# define EXEC(XT) ({goto *(XT);}) |
|
#endif |
#endif |
|
|
|
#if GCC_PR15242_WORKAROUND |
#if THREADING_SCHEME==3 |
#define DO_GOTO goto before_goto |
#warning direct threading scheme 3: autoinc, low latency, cfa live |
#else |
# define CFA_NEXT |
#define DO_GOTO goto *real_ca |
# define NEXT_P0 |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (*ip) |
|
# define INC_IP(const_inc) ({ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 ({cfa=*ip++;}) |
|
# define NEXT_P2 ({goto *cfa;}) |
|
# define EXEC(XT) ({cfa=(XT); goto *cfa;}) |
|
#endif |
#endif |
|
|
#if THREADING_SCHEME==4 |
#ifndef GOTO_ALIGN |
#warning direct threading scheme 4: autoinc, low latency, cfa dead |
#define GOTO_ALIGN |
#ifndef GETCFA |
|
#error GETCFA must be defined for cfa dead threading |
|
#endif |
|
# define NEXT_P0 |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (*ip) |
|
# define INC_IP(const_inc) ({ ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 |
|
# define NEXT_P2 ({goto **(ip++);}) |
|
# define EXEC(XT) ({goto *(XT);}) |
|
#endif |
#endif |
|
|
#if THREADING_SCHEME==5 |
#define GOTO(target) do {(real_ca=(target));} while(0) |
#warning direct threading scheme 5: long latency, cfa live |
#define NEXT_P2 do {NEXT_P1_5; DO_GOTO;} while(0) |
# define CFA_NEXT |
#define EXEC(XT) do { real_ca=EXEC1(XT); DO_GOTO;} while (0) |
# define NEXT_P0 ({cfa=*ip;}) |
#define VM_JUMP(target) do {GOTO(target);} while (0) |
# define IP (ip) |
#define NEXT do {DEF_CA NEXT_P1; NEXT_P2;} while(0) |
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
#define FIRST_NEXT_P2 NEXT_P1_5; GOTO_ALIGN; \ |
# define NEXT_INST (cfa) |
before_goto: goto *real_ca; after_goto: |
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
#define FIRST_NEXT do {DEF_CA NEXT_P1; FIRST_NEXT_P2;} while(0) |
# define DEF_CA |
#define IPTOS NEXT_INST |
# define NEXT_P1 (ip++) |
|
# define NEXT_P2 ({goto *cfa;}) |
|
# define EXEC(XT) ({cfa=(XT); goto *cfa;}) |
|
#endif |
|
|
|
#if THREADING_SCHEME==6 |
|
#warning direct threading scheme 6: long latency, cfa dead |
|
#ifndef GETCFA |
|
#error GETCFA must be defined for cfa dead threading |
|
#endif |
|
# define NEXT_P0 |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (*ip) |
|
# define INC_IP(const_inc) ({ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 (ip++) |
|
# define NEXT_P2 ({goto **(ip-1);}) |
|
# define EXEC(XT) ({goto *(XT);}) |
|
#endif |
|
|
|
|
#ifdef DOUBLY_INDIRECT |
|
# ifndef DEBUG_DITC |
|
# define DEBUG_DITC 0 |
|
# endif |
|
/* define to 1 if you want to check consistency */ |
|
# define NEXT_P0 do {cfa1=cfa; cfa=*ip;} while(0) |
|
# define CFA cfa1 |
|
# define MORE_VARS Xt cfa1; |
|
# define IP (ip) |
|
# define SET_IP(p) do {ip=(p); cfa=*ip;} while(0) |
|
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) do {cfa=IP[const_inc]; ip+=(const_inc);} while(0) |
|
# define DEF_CA Label MAYBE_UNUSED ca; |
|
# define NEXT_P1 do {\ |
|
if (DEBUG_DITC && (cfa<=vm_prims+DOESJUMP || cfa>=vm_prims+npriminfos)) \ |
|
fprintf(stderr,"NEXT encountered prim %p at ip=%p\n", cfa, ip); \ |
|
ip++;} while(0) |
|
# define NEXT_P1_5 do {ca=**cfa; GOTO(ca);} while(0) |
|
# define EXEC1(XT) ({DEF_CA cfa=(XT);\ |
|
if (DEBUG_DITC && (cfa>vm_prims+DOESJUMP && cfa<vm_prims+npriminfos)) \ |
|
fprintf(stderr,"EXEC encountered xt %p at ip=%p, vm_prims=%p, xts=%p\n", cfa, ip, vm_prims, xts); \ |
|
ca=**cfa; ca;}) |
|
|
|
#elif defined(NO_IP) |
|
|
|
#define NEXT_P0 |
|
# define CFA cfa |
|
#define SET_IP(target) assert(0) |
|
#define INC_IP(n) ((void)0) |
|
#define DEF_CA |
|
#define NEXT_P1 |
|
#define NEXT_P1_5 do {goto *next_code;} while(0) |
|
/* set next_code to the return address before performing EXEC */ |
|
/* original: */ |
|
/* #define EXEC1(XT) do {cfa=(XT); goto **cfa;} while(0) */ |
|
/* fake, to make syntax check work */ |
|
#define EXEC1(XT) ({cfa=(XT); *cfa;}) |
|
|
#if THREADING_SCHEME==7 |
#else /* !defined(DOUBLY_INDIRECT) && !defined(NO_IP) */ |
#warning direct threading scheme 7: low latency, cfa live |
|
# define CFA_NEXT |
|
# define NEXT_P0 |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (*ip) |
|
# define INC_IP(const_inc) ({ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 ({cfa=*ip++;}) |
|
# define NEXT_P2 ({goto *cfa;}) |
|
# define EXEC(XT) ({cfa=(XT); goto *cfa;}) |
|
#endif |
|
|
|
#if THREADING_SCHEME==8 |
#if defined(DIRECT_THREADED) |
#warning direct threading scheme 8: cfa dead, i386 hack |
|
#ifndef GETCFA |
|
#error GETCFA must be defined for cfa dead threading |
|
#endif |
|
# define NEXT_P0 |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (*IP) |
|
# define INC_IP(const_inc) ({ ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 (ip++) |
|
# define NEXT_P2 ({goto **(ip-1);}) |
|
# define EXEC(XT) ({goto *(XT);}) |
|
#endif |
|
|
|
#if THREADING_SCHEME==9 |
/* This lets the compiler know that cfa is dead before; we place it at |
#warning direct threading scheme 9: Power/PPC hack, long latency |
"goto *"s that perform direct threaded dispatch (i.e., not EXECUTE |
/* Power uses a prepare-to-branch instruction, and the latency between |
etc.), and thus do not reach doers, which would use cfa; the only |
this inst and the branch is 5 cycles on a PPC604; so we utilize this |
way to a doer is through EXECUTE etc., which set the cfa |
to do some prefetching in between */ |
themselves. |
# define CFA_NEXT |
|
# define NEXT_P0 |
|
# define IP ip |
|
# define SET_IP(p) ({ip=(p); next_cfa=*ip; NEXT_P0;}) |
|
# define NEXT_INST (next_cfa) |
|
# define INC_IP(const_inc) ({next_cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA Label ca; |
|
# define NEXT_P1 ({ca=next_cfa; cfa=next_cfa; ip++; next_cfa=*ip;}) |
|
# define NEXT_P2 ({goto *ca;}) |
|
# define EXEC(XT) ({cfa=(XT); goto *cfa;}) |
|
# define MORE_VARS Xt next_cfa; |
|
#endif |
|
|
|
#if THREADING_SCHEME==10 |
Some of these direct threaded schemes use "cfa" to hold the code |
#warning direct threading scheme 10: plain (no attempt at scheduling) |
address in normal direct threaded code. Of course we cannot use |
# define CFA_NEXT |
KILLS there. |
# define NEXT_P0 |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (*ip) |
|
# define INC_IP(const_inc) ({ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 |
|
# define NEXT_P2 ({cfa=*ip++; goto *cfa;}) |
|
# define EXEC(XT) ({cfa=(XT); goto *cfa;}) |
|
#endif |
|
|
|
/* direct threaded */ |
KILLS works by having an empty asm instruction, and claiming to the |
#else |
compiler that it writes to cfa. |
/* indirect THREADED */ |
|
|
|
#if THREADING_SCHEME==1 |
KILLS is optional. You can write |
#warning indirect threading scheme 1: autoinc, long latency, cisc |
|
# define CFA_NEXT |
|
# define NEXT_P0 ({cfa=*ip++;}) |
|
# define IP (ip-1) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA |
|
# define NEXT_P1 |
|
# define NEXT_P2 ({goto **cfa;}) |
|
# define EXEC(XT) ({cfa=(XT); goto **cfa;}) |
|
#endif |
|
|
|
#if THREADING_SCHEME==2 |
#define KILLS |
#warning indirect threading scheme 2: autoinc, long latency |
|
# define CFA_NEXT |
|
# define NEXT_P0 ({cfa=*ip++;}) |
|
# define IP (ip-1) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA Label ca; |
|
# define NEXT_P1 ({ca=*cfa;}) |
|
# define NEXT_P2 ({goto *ca;}) |
|
# define EXEC(XT) ({DEF_CA cfa=(XT); ca=*cfa; goto *ca;}) |
|
#endif |
|
|
|
|
and lose just a little performance. |
|
*/ |
|
#define KILLS asm("":"=X"(cfa)); |
|
|
#if THREADING_SCHEME==3 |
/* #warning direct threading scheme 8: cfa dead, i386 hack */ |
#warning indirect threading scheme 3: autoinc, low latency, cisc |
|
# define CFA_NEXT |
|
# define NEXT_P0 |
# define NEXT_P0 |
|
# define CFA cfa |
# define IP (ip) |
# define IP (ip) |
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
# define SET_IP(p) do {ip=(p); NEXT_P0;} while(0) |
# define NEXT_INST (*ip) |
# define NEXT_INST (*IP) |
# define INC_IP(const_inc) ({ip+=(const_inc);}) |
# define INC_IP(const_inc) do { ip+=(const_inc);} while(0) |
# define DEF_CA |
|
# define NEXT_P1 |
|
# define NEXT_P2 ({cfa=*ip++; goto **cfa;}) |
|
# define EXEC(XT) ({cfa=(XT); goto **cfa;}) |
|
#endif |
|
|
|
#if THREADING_SCHEME==4 |
|
#warning indirect threading scheme 4: autoinc, low latency |
|
# define CFA_NEXT |
|
# define NEXT_P0 ({cfa=*ip++;}) |
|
# define IP (ip-1) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA Label ca; |
|
# define NEXT_P1 ({ca=*cfa;}) |
|
# define NEXT_P2 ({goto *ca;}) |
|
# define EXEC(XT) ({DEF_CA cfa=(XT); ca=*cfa; goto *ca;}) |
|
#endif |
|
|
|
|
|
#if THREADING_SCHEME==5 |
|
#warning indirect threading scheme 5: long latency, cisc |
|
# define CFA_NEXT |
|
# define NEXT_P0 ({cfa=*ip;}) |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA |
# define DEF_CA |
# define NEXT_P1 (ip++) |
# define NEXT_P1 (ip++) |
# define NEXT_P2 ({goto **cfa;}) |
# define NEXT_P1_5 do {KILLS GOTO(*(ip-1));} while(0) |
# define EXEC(XT) ({cfa=(XT); goto **cfa;}) |
# define EXEC1(XT) ({cfa=(XT); *cfa;}) |
#endif |
|
|
|
#if THREADING_SCHEME==6 |
/* direct threaded */ |
#warning indirect threading scheme 6: long latency |
#else |
# define CFA_NEXT |
/* indirect THREADED */ |
# define NEXT_P0 ({cfa=*ip;}) |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA Label ca; |
|
# define NEXT_P1 ({ip++; ca=*cfa;}) |
|
# define NEXT_P2 ({goto *ca;}) |
|
# define EXEC(XT) ({DEF_CA cfa=(XT); ca=*cfa; goto *ca;}) |
|
#endif |
|
|
|
#if THREADING_SCHEME==7 |
|
#warning indirect threading scheme 7: low latency |
|
# define CFA_NEXT |
|
# define NEXT_P0 ({cfa=*ip;}) |
|
# define IP (ip) |
|
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
|
# define NEXT_INST (cfa) |
|
# define INC_IP(const_inc) ({cfa=IP[const_inc]; ip+=(const_inc);}) |
|
# define DEF_CA Label ca; |
|
# define NEXT_P1 ({ip++; ca=*cfa;}) |
|
# define NEXT_P2 ({goto *ca;}) |
|
# define EXEC(XT) ({DEF_CA cfa=(XT); ca=*cfa; goto *ca;}) |
|
#endif |
|
|
|
#if THREADING_SCHEME==8 |
/* #warning indirect threading scheme 8: low latency,cisc */ |
#warning indirect threading scheme 8: low latency,cisc |
|
# define CFA_NEXT |
|
# define NEXT_P0 |
# define NEXT_P0 |
|
# define CFA cfa |
# define IP (ip) |
# define IP (ip) |
# define SET_IP(p) ({ip=(p); NEXT_P0;}) |
# define SET_IP(p) do {ip=(p); NEXT_P0;} while(0) |
# define NEXT_INST (*ip) |
# define NEXT_INST (*ip) |
# define INC_IP(const_inc) ({ip+=(const_inc);}) |
# define INC_IP(const_inc) do {ip+=(const_inc);} while(0) |
# define DEF_CA |
# define DEF_CA |
# define NEXT_P1 |
# define NEXT_P1 |
# define NEXT_P2 ({cfa=*ip++; goto **cfa;}) |
# define NEXT_P1_5 do {cfa=*ip++; GOTO(*cfa);} while(0) |
# define EXEC(XT) ({cfa=(XT); goto **cfa;}) |
# define EXEC1(XT) ({cfa=(XT); *cfa;}) |
#endif |
|
|
|
/* indirect threaded */ |
/* indirect threaded */ |
#endif |
#endif |
|
|
#endif /* !defined(DOUBLY_INDIRECT) */ |
#endif /* !defined(DOUBLY_INDIRECT) && !defined(NO_IP) */ |
|
|
#define NEXT ({DEF_CA NEXT_P1; NEXT_P2;}) |
|
|
|