diff options
Diffstat (limited to 'ext/systemc/src/sysc/qt/md')
52 files changed, 7468 insertions, 0 deletions
diff --git a/ext/systemc/src/sysc/qt/md/axp.1.Makefile b/ext/systemc/src/sysc/qt/md/axp.1.Makefile new file mode 100644 index 000000000..86ccd8f42 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/axp.1.Makefile @@ -0,0 +1,5 @@ + +# +# Compiling for the DEC AXP (alpha) with GNU CC or version 1.x of OSF. +# +CC = cc -std1 -D__AXP__ -D__OSF1__ diff --git a/ext/systemc/src/sysc/qt/md/axp.2.Makefile b/ext/systemc/src/sysc/qt/md/axp.2.Makefile new file mode 100644 index 000000000..268636fc9 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/axp.2.Makefile @@ -0,0 +1,5 @@ + +# +# Compiling for the DEC AXP (alpha) with GNU CC or version 2.x of OSF. +# +CC = cc -std1 -D__AXP__ -D__OSF2__ diff --git a/ext/systemc/src/sysc/qt/md/axp.Makefile b/ext/systemc/src/sysc/qt/md/axp.Makefile new file mode 100644 index 000000000..4e6d74da4 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/axp.Makefile @@ -0,0 +1,5 @@ + +# +# GNU CC +# +CC = gcc -D__AXP__ diff --git a/ext/systemc/src/sysc/qt/md/axp.README b/ext/systemc/src/sysc/qt/md/axp.README new file mode 100644 index 000000000..b6a705c07 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/axp.README @@ -0,0 +1,10 @@ +The handling of varargs is platform-dependent. Assar Westerlund +stared at the problem for a while and deduces the following table: + +vers / compiler cc gcc +---------------------------------------------------------------------- +1.3 a0, offset __base, __offset +2.0 _a0, _offset __base, __offset + +The current code should handle both cc and gcc versions, provided +you configure for the correct compiler. diff --git a/ext/systemc/src/sysc/qt/md/axp.c b/ext/systemc/src/sysc/qt/md/axp.c new file mode 100644 index 000000000..268612993 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/axp.c @@ -0,0 +1,133 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#include <stdarg.h> +#include "qt.h" + + +/* Varargs is harder on the AXP. Parameters are saved on the stack as + something like (stack grows down to low memory; low at bottom of + picture): + + | : + | arg6 + +--- + | iarg5 + | : + | iarg3 <-- va_list._a0 + va_list._offset + | : + | iarg0 <-- va_list._a0 + +--- + | farg5 + | : + | farg0 + +--- + + When some of the arguments have known type, there is no need to + save all of them in the struct. So, for example, if the routine is + called + + zork (int a0, float a1, int a2, ...) + { + va_list ap; + va_start (ap, a2); + qt_vargs (... &ap ...); + } + + then offset is set to 3 * 8 (8 === sizeof machine word) = 24. + + What this means for us is that the user's routine needs to be + called with an arg list where some of the words in the `any type' + parameter list have to be split and moved up in to the int/fp + region. + + Ways in which this can fail: + - The user might not know the size of the pushed arguments anyway. + - Structures have funny promotion rules. + - Probably lots of other things. + + All in all, we never promised varargs would work reliably. */ + + + +#define QUICKTHREADS_VADJ(sp) (((char *)sp) - QUICKTHREADS_VSTKBASE) + +#define QUICKTHREADS_VARGS_MD0(sp, vabytes) \ + ((qt_t *)(((char *)(sp)) - 6*2*8 - QUICKTHREADS_STKROUNDUP(vabytes))) + +extern void qt_vstart(void); +#define QUICKTHREADS_VARGS_MD1(sp) (QUICKTHREADS_SPUT (sp, QUICKTHREADS_R26, qt_vstart)) + + +/* Different machines use different implementations for varargs. + Unfortunately, the code below ``looks in to'' the varargs + structure, `va_list', and thus depends on the conventions. + The following #defines try to deal with it but don't catch + everything. */ + +#ifdef __GNUC__ +#define _a0 __base +#define _offset __offset +#else +#ifdef __OSF1__ +#define _a0 a0 +#define _offset offset +#endif +#endif /* def __GNUC__ */ + + + struct qt_t * +qt_vargs (struct qt_t *qsp, int nbytes, struct va_list *vargs, + void *pt, qt_function_t *startup, + qt_function_t *vuserf, qt_function_t *cleanup) +{ + va_list ap; + int i; + int max; /* Maximum *words* of args to copy. */ + int tmove; /* *Words* of args moved typed->typed. */ + qt_word_t *sp; + + ap = *(va_list *)vargs; + qsp = QUICKTHREADS_VARGS_MD0 (qsp, nbytes); + sp = (qt_word_t *)qsp; + + tmove = 6 - ap._offset/sizeof(qt_word_t); + + /* Copy from one typed area to the other. */ + for (i=0; i<tmove; ++i) { + /* Integer args: */ + sp[i+6] = ((qt_word_t *)(ap._a0 + ap._offset))[i]; + /* Fp args: */ + sp[i] = ((qt_word_t *)(ap._a0 + ap._offset))[i-6]; + } + + max = nbytes/sizeof(qt_word_t); + + /* Copy from the untyped area to the typed area. Split each arg. + in to integer and floating-point save areas. */ + for (; i<6 && i<max; ++i) { + sp[i] = sp[i+6] = ((qt_word_t *)(ap._a0 + ap._offset))[i]; + } + + /* Copy from the untyped area to the other untyped area. */ + for (; i<max; ++i) { + sp[i+6] = ((qt_word_t *)(ap._a0 + ap._offset))[i]; + } + + QUICKTHREADS_VARGS_MD1 (QUICKTHREADS_VADJ(sp)); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VARGT_INDEX, pt); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VSTARTUP_INDEX, startup); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VUSERF_INDEX, vuserf); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VCLEANUP_INDEX, cleanup); + return ((qt_t *)QUICKTHREADS_VADJ(sp)); +} diff --git a/ext/systemc/src/sysc/qt/md/axp.h b/ext/systemc/src/sysc/qt/md/axp.h new file mode 100644 index 000000000..3aac9ff1d --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/axp.h @@ -0,0 +1,160 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#ifndef QUICKTHREADS_AXP_H +#define QUICKTHREADS_AXP_H + +#define QUICKTHREADS_GROW_DOWN + +typedef unsigned long qt_word_t; + + +/* Stack layout on the Alpha: + + Integer: + + Caller-save: r0..r8, r22..r25, r27..r29 + argument/caller-save: r16..r21 + callee-save: r9..r15 + return pc *callee-save*: r26 + stack pointer: r30 + zero: r31 + + Floating-point: + + Caller-save: f0..f1, f10..f15 + argument/caller-save: f16..f21, f22..f30 + callee-save: f2..f9 + zero: f31 + + Non-varargs: + + +--- + | padding + | f9 + | f8 + | f7 + | f6 + | f5 + | f4 + | f3 + | f2 + | r26 + +--- + | padding + | r29 + | r15 + | r14 + | r13 + | r12 on startup === `only' + | r11 on startup === `userf' + | r10 on startup === `qt' + | r9 on startup === `qu' + | r26 on startup === qt_start <--- qt.sp + +--- + + Conventions for varargs startup: + + | : + | arg6 + | iarg5 + | : + | iarg0 + | farg5 + | : + | farg0 + +--- + | padding + | r29 + | r15 + | r14 + | r13 + | r12 on startup === `startup' + | r11 on startup === `vuserf' + | r10 on startup === `cleanup' + | r9 on startup === `qt' + | r26 on startup === qt_vstart <--- qt.sp + +--- + + Note: this is a pretty cheap/sleazy way to get things going, + but ``there must be a better way.'' For instance, some varargs + parameters could be loaded in to integer registers, or the return + address could be stored on top of the stack. */ + + +/* Stack must be 16-byte aligned. */ +#define QUICKTHREADS_STKALIGN (16) + +/* How much space is allocated to hold all the crud for + initialization: 7 registers times 8 bytes/register. */ + +#define QUICKTHREADS_STKBASE (10 * 8) +#define QUICKTHREADS_VSTKBASE QUICKTHREADS_STKBASE + + +/* Offsets of various registers. */ +#define QUICKTHREADS_R26 0 +#define QUICKTHREADS_R9 1 +#define QUICKTHREADS_R10 2 +#define QUICKTHREADS_R11 3 +#define QUICKTHREADS_R12 4 + + +/* When a never-before-run thread is restored, the return pc points + to a fragment of code that starts the thread running. For + non-vargs functions, it just calls the client's `only' function. + For varargs functions, it calls the startup, user, and cleanup + functions. + + The varargs startup routine always reads 12 8-byte arguments from + the stack. If fewer argumets were pushed, the startup routine + would read off the top of the stack. To prevent errors we always + allocate enough space. When there are fewer args, the preallocated + words are simply wasted. */ + +extern void qt_start(void); +#define QUICKTHREADS_ARGS_MD(sp) (QUICKTHREADS_SPUT (sp, QUICKTHREADS_R26, qt_start)) + + +/* The AXP uses a struct for `va_list', so pass a pointer to the + struct. This may break some uses of `QUICKTHREADS_VARGS', but then we never + claimed it was totally portable. */ + +typedef void (qt_function_t)(void); + +struct qt_t; +struct va_list; +extern struct qt_t *qt_vargs (struct qt_t *sp, int nbytes, + struct va_list *vargs, void *pt, + qt_function_t *startup, + qt_function_t *vuserf, + qt_function_t *cleanup); + +#define QUICKTHREADS_VARGS(sp, nbytes, vargs, pt, startup, vuserf, cleanup) \ + (qt_vargs (sp, nbytes, (struct va_list *)(&(vargs)), pt, \ + (qt_function_t *) startup, (qt_function_t *)vuserf, \ + (qt_function_t *)cleanup)); + + +/* The *index* (positive offset) of where to put each value. */ +#define QUICKTHREADS_ONLY_INDEX (QUICKTHREADS_R12) +#define QUICKTHREADS_USER_INDEX (QUICKTHREADS_R11) +#define QUICKTHREADS_ARGT_INDEX (QUICKTHREADS_R10) +#define QUICKTHREADS_ARGU_INDEX (QUICKTHREADS_R9) + +#define QUICKTHREADS_VCLEANUP_INDEX (QUICKTHREADS_R10) +#define QUICKTHREADS_VUSERF_INDEX (QUICKTHREADS_R11) +#define QUICKTHREADS_VSTARTUP_INDEX (QUICKTHREADS_R12) +#define QUICKTHREADS_VARGT_INDEX (QUICKTHREADS_R9) + +#endif /* ndef QUICKTHREADS_AXP_H */ diff --git a/ext/systemc/src/sysc/qt/md/axp.s b/ext/systemc/src/sysc/qt/md/axp.s new file mode 100644 index 000000000..a84aab2cc --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/axp.s @@ -0,0 +1,160 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +/* axp.s -- assembly support. */ + + .text + .align 4 + .file 2 "axp.s" + + .globl qt_block + .globl qt_blocki + .globl qt_abort + .globl qt_start + .globl qt_vstart + + /* + ** $16: ptr to function to call once curr is suspended + ** and control is on r19's stack. + ** $17: 1'th arg to (*$16)(...). + ** $18: 2'th arg to (*$16)(...). + ** $19: sp of thread to resume. + ** + ** The helper routine returns a value that is passed on as the + ** return value from the blocking routine. Since we don't + ** touch r0 between the helper's return and the end of + ** function, we get this behavior for free. + */ + + .ent qt_blocki +qt_blocki: + subq $30,80, $30 /* Allocate save area. */ + stq $26, 0($30) /* Save registers. */ + stq $9, 8($30) + stq $10,16($30) + stq $11,24($30) + stq $12,32($30) + stq $13,40($30) + stq $14,48($30) + stq $15,56($30) + stq $29,64($30) + .end qt_blocki + .ent qt_abort +qt_abort: + addq $16,$31, $27 /* Put argument function in PV. */ + addq $30,$31, $16 /* Save stack ptr in outgoing arg. */ + addq $19,$31, $30 /* Set new stack pointer. */ + jsr $26,($27),0 /* Call helper function. */ + + ldq $26, 0($30) /* Restore registers. */ + ldq $9, 8($30) + ldq $10,16($30) + ldq $11,24($30) + ldq $12,32($30) + ldq $13,40($30) + ldq $14,48($30) + ldq $15,56($30) + ldq $29,64($30) + + addq $30,80, $30 /* Deallocate save area. */ + ret $31,($26),1 /* Return, predict===RET. */ + .end qt_abort + + + /* + ** Non-varargs thread startup. + */ + .ent qt_start +qt_start: + addq $9,$31, $16 /* Load up `qu'. */ + addq $10,$31, $17 /* ... user function's `pt'. */ + addq $11,$31, $18 /* ... user function's `userf'. */ + addq $12,$31, $27 /* ... set procedure value to `only'. */ + jsr $26,($27),0 /* Call `only'. */ + + jsr $26,qt_error /* `only' erroniously returned. */ + .end qt_start + + + .ent qt_vstart: +qt_vstart: + /* Call startup function. */ + addq $9,$31, $16 /* Arg0 to `startup'. */ + addq $12,$31, $27 /* Set procedure value. */ + jsr $26,($27),0 /* Call `startup'. */ + + /* Call user function. */ + ldt $f16, 0($30) /* Load fp arg regs. */ + ldt $f17, 8($30) + ldt $f18,16($30) + ldt $f19,24($30) + ldt $f20,32($30) + ldt $f21,40($30) + ldq $16,48($30) /* And integer arg regs. */ + ldq $17,56($30) + ldq $18,64($30) + ldq $19,72($30) + ldq $20,80($30) + ldq $21,88($30) + addq $30,96 $30 /* Pop 6*2*8 saved arg regs. */ + addq $11,$31, $27 /* Set procedure value. */ + jsr $26,($27),0 /* Call `vuserf'. */ + + /* Call cleanup. */ + addq $9,$31, $16 /* Arg0 to `cleanup'. */ + addq $0,$31, $17 /* Users's return value is arg1. */ + addq $10,$31, $27 /* Set procedure value. */ + jsr $26,($27),0 /* Call `cleanup'. */ + + jsr $26,qt_error /* Cleanup erroniously returned. */ + .end qt_start + + + /* + ** Save calle-save floating-point regs $f2..$f9. + ** Also save return pc from whomever called us. + ** + ** Return value from `qt_block' is the same as the return from + ** `qt_blocki'. We get that for free since we don't touch $0 + ** between the return from `qt_blocki' and the return from + ** `qt_block'. + */ + .ent qt_block +qt_block: + subq $30,80, $30 /* Allocate a save space. */ + stq $26, 0($30) /* Save registers. */ + stt $f2, 8($30) + stt $f3,16($30) + stt $f4,24($30) + stt $f5,32($30) + stt $f6,40($30) + stt $f7,48($30) + stt $f8,56($30) + stt $f9,64($30) + + jsr $26,qt_blocki /* Call helper. */ + /* .. who will also restore $gp. */ + + ldq $26, 0($30) /* restore registers. */ + ldt $f2, 8($30) + ldt $f3,16($30) + ldt $f4,24($30) + ldt $f5,32($30) + ldt $f6,40($30) + ldt $f7,48($30) + ldt $f8,56($30) + ldt $f9,64($30) + + addq $30,80, $30 /* Deallcate save space. */ + ret $31,($26),1 /* Return, predict===RET. */ + .end qt_block diff --git a/ext/systemc/src/sysc/qt/md/axp_b.s b/ext/systemc/src/sysc/qt/md/axp_b.s new file mode 100644 index 000000000..60be726ff --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/axp_b.s @@ -0,0 +1,111 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + .text + .globl b_call_reg + .globl b_call_imm + .globl b_add + .globl b_load + + .ent b_null +b_null: + ret $31,($18),1 + .end b_null + + .ent b_call_reg +b_call_reg: + lda $27,b_null +$L0: + jsr $18,($27) + jsr $18,($27) + jsr $18,($27) + jsr $18,($27) + jsr $18,($27) + + jsr $18,($27) + jsr $18,($27) + jsr $18,($27) + jsr $18,($27) + jsr $18,($27) + + subq $16,1,$16 + bgt $16,$L0 + + ret $31,($26),1 + .end + + + .ent b_call_imm +b_call_imm: +$L1: + jsr $18,b_null + jsr $18,b_null + jsr $18,b_null + jsr $18,b_null + jsr $18,b_null + + jsr $18,b_null + jsr $18,b_null + jsr $18,b_null + jsr $18,b_null + jsr $18,b_null + + subq $16,1,$16 + bgt $16,$L1 + + ret $31,($26),1 + .end + + + .ent b_add +b_add: +$L2: + addq $31,$31,$31 + addq $31,$31,$31 + addq $31,$31,$31 + addq $31,$31,$31 + addq $31,$31,$31 + + addq $31,$31,$31 + addq $31,$31,$31 + addq $31,$31,$31 + addq $31,$31,$31 + addq $31,$31,$31 + + subq $16,1,$16 + bgt $16,$L2 + + ret $31,($26),1 + .end + + + .ent b_load +b_load: +$L3: + ldq $31,0($30) + ldq $31,8($30) + ldq $31,16($30) + ldq $31,24($30) + ldq $31,32($30) + + ldq $31,0($30) + ldq $31,8($30) + ldq $31,16($30) + ldq $31,24($30) + ldq $31,32($30) + + subq $16,1,$16 + bgt $16,$L3 + + ret $31,($26),1 + .end diff --git a/ext/systemc/src/sysc/qt/md/default.Makefile b/ext/systemc/src/sysc/qt/md/default.Makefile new file mode 100644 index 000000000..2f3ded151 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/default.Makefile @@ -0,0 +1,8 @@ + +# +# `Normal' configuration. +# +CC = gcc -ansi -Wall -pedantic + +.o.s: + as -o $@ $< diff --git a/ext/systemc/src/sysc/qt/md/hppa-cnx.Makefile b/ext/systemc/src/sysc/qt/md/hppa-cnx.Makefile new file mode 100644 index 000000000..bff257d9f --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/hppa-cnx.Makefile @@ -0,0 +1,9 @@ +# This file (cnx_spp.Makefile) is part of the port of QuickThreads for +# PA-RISC 1.1 architecture on a Convex SPP. This file is a machine dependent +# makefile for QuickThreads. It was written in 1994 by Uwe Reder +# (`uereder@cip.informatik.uni-erlangen.de') for the Operating Systems +# Department (IMMD4) at the University of Erlangen/Nuernberg Germany. + +# `Normal' configuration. + +CC = /usr/convex/bin/cc diff --git a/ext/systemc/src/sysc/qt/md/hppa.Makefile b/ext/systemc/src/sysc/qt/md/hppa.Makefile new file mode 100644 index 000000000..bf770ae3b --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/hppa.Makefile @@ -0,0 +1,12 @@ +# This file (pa-risc.Makefile) is part of the port of QuickThreads for +# PA-RISC 1.1 architecture. This file is a machine dependent makefile +# for QuickThreads. It was written in 1994 by Uwe Reder +# (`uereder@cip.informatik.uni-erlangen.de') for the Operating Systems +# Department (IMMD4) at the University of Erlangen/Nuernberg Germany. + +# `Normal' configuration. + +CC = cc -Aa + +.s.o: + /usr/ccs/bin/as -o $@ $< diff --git a/ext/systemc/src/sysc/qt/md/hppa.h b/ext/systemc/src/sysc/qt/md/hppa.h new file mode 100644 index 000000000..fdb9cef93 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/hppa.h @@ -0,0 +1,196 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +/* + * This file (pa-risc.h) is part of the port of QuickThreads for the + * PA-RISC 1.1 architecture. This file is a machine dependent header + * file. It was written in 1994 by Uwe Reder + * (`uereder@cip.informatik.uni-erlangen.de') for the Operating Systems + * Department (IMMD4) at the University of Erlangen/Nuernberg Germany. + */ + + +#ifndef QUICKTHREADS_PA_RISC_H +#define QUICKTHREADS_PA_RISC_H + +#if 0 +#include <qt.h> +#endif + +/* size of an integer-register (32 bit) */ +typedef unsigned long qt_word_t; + +/* PA-RISC's stack grows up */ +#define QUICKTHREADS_GROW_UP + +/* Stack layout on PA-RISC according to PA-RISC Procedure Calling Conventions: + + Callee-save registers are: gr3-gr18, fr12-fr21. + Also save gr2, return pointer. + + +--- + | fr12 Each floating register is a double word (8 bytes). + | fr13 Floating registers are only saved if `qt_block' is + | fr14 called, in which case it saves the floating-point + | fr15 registers then calls `qt_blocki' to save the integer + | fr16 registers. + | fr17 + | fr18 + | fr19 + | fr20 + | fr21 + | <arg word 3> fixed arguments (must be allocated; may remain unused) + | <arg word 2> + | <arg word 1> + | <arg word 0> + | <LPT> frame marker + | <LPT'> + | <RP'> + | <Current RP> + | <Static Link> + | <Clean Up> + | <RP''> + | <Previous SP> + +--- + | gr3 word each (4 bytes) + | gr4 + | gr5 + | gr6 + | gr7 + | gr8 + | gr9 + | gr10 + | gr11 + | gr12 + | gr13 + | gr14 + | gr15 + | gr16 + | gr17 + | gr18 + | <16 bytes filled in (sp has to be 64-bytes aligned)> + | <arg word 3> fixed arguments (must be allocated; may remain unused) + | <arg word 2> + | <arg word 1> + | <arg word 0> + | <LPT> frame marker + | <LPT'> + | <RP'> + | <Current RP> + | <Static Link> + | <Clean Up> + | <RP''> + | <Previous SP> + +--- <--- sp +*/ + +/* When a never-before-run thread is restored, the return pc points + to a fragment of code that starts the thread running. For + non-vargs functions, it just calls the client's `only' function. + For varargs functions, it calls the startup, user, and cleanup + functions. */ + +/* Note: Procedue Labels on PA-RISC + + <--2--><-------28---------><1-><1-> + ----------------------------------- + | SID | Adress Part | L | X | + ----------------------------------- + + On HP-UX the L field is used to flag wheather the procedure + label (plabel) is a pointer to an LT entry or to the entry point + of the procedure (PA-RISC Procedure Calling Conventions Reference + Manual, 5.3.2 Procedure Labels and Dynamic Calls). */ + +#define QUICKTHREADS_PA_RISC_READ_PLABEL(plabel) \ + ( (((int)plabel) & 2) ? \ + ( (*((int *)(((int)plabel) & 0xfffffffc)))) : ((int)plabel) ) + +/* Stack must be 64 bytes aligned. */ +#define QUICKTHREADS_STKALIGN (64) + +/* Internal helper for putting stuff on stack (negative index!). */ +#define QUICKTHREADS_SPUT(top, at, val) \ + (((qt_word_t *)(top))[-(at)] = (qt_word_t)(val)) + +/* Offsets of various registers which are modified on the stack. + rp (return-pointer) has to be stored in the frame-marker-area + of the "older" stack-segment. */ + +#define QUICKTHREADS_crp (12+4+16+5) +#define QUICKTHREADS_15 (12+4+4) +#define QUICKTHREADS_16 (12+4+3) +#define QUICKTHREADS_17 (12+4+2) +#define QUICKTHREADS_18 (12+4+1) + + +/** This stuff is for NON-VARARGS. **/ + +/* Stack looks like this (2 stack frames): + + <--- 64-bytes aligned --><------- 64-bytes aligned ------------> + | || | + <--16--><------48-------><----16*4-----><--16-><------48-------> + || | || | | || + ||filler|arg|frame-marker||register-save|filler|arg|frame-marker|| + ------------------------------------------------------------------ + */ + +#define QUICKTHREADS_STKBASE (16+48+(16*sizeof(qt_word_t))+16+48) + +/* The index, relative to sp, of where to put each value. */ +#define QUICKTHREADS_ONLY_INDEX (QUICKTHREADS_15) +#define QUICKTHREADS_USER_INDEX (QUICKTHREADS_16) +#define QUICKTHREADS_ARGT_INDEX (QUICKTHREADS_17) +#define QUICKTHREADS_ARGU_INDEX (QUICKTHREADS_18) + +extern void qt_start(void); +#define QUICKTHREADS_ARGS_MD(sp) \ + (QUICKTHREADS_SPUT (sp, QUICKTHREADS_crp, QUICKTHREADS_PA_RISC_READ_PLABEL(qt_start))) + + +/** This is for VARARGS. **/ + +#define QUICKTHREADS_VARGS_DEFAULT + +/* Stack looks like this (2 stack frames): + + <------ 64-bytes aligned -------><--------- 64-bytes aligned ----------> + | || | + <---?--><--?---><16><----32-----><----16*4-----><-16--><16><----32-----> + || | | | || | | | || + ||filler|varargs|arg|frame-marker||register-save|filler|arg|frame-marker|| + -------------------------------------------------------------------------- + */ + +/* Sp is moved to the end of the first stack frame. */ +#define QUICKTHREADS_VARGS_MD0(sp, vasize) \ + ((qt_t *)(((char *)sp) + QUICKTHREADS_STKROUNDUP(vasize + 4*4 + 32))) + +/* To reach the arguments from the end of the first stack frame use 32 + as a negative adjustment. */ +#define QUICKTHREADS_VARGS_ADJUST(sp) ((qt_t *)(((char *)sp) - 32)) + +/* Offset to reach the end of the second stack frame. */ +#define QUICKTHREADS_VSTKBASE ((16*sizeof(qt_word_t)) + 16 + 4*4 + 32) + +extern void qt_vstart(void); +#define QUICKTHREADS_VARGS_MD1(sp) \ + (QUICKTHREADS_SPUT (sp, QUICKTHREADS_crp, QUICKTHREADS_PA_RISC_READ_PLABEL(qt_vstart))) + +#define QUICKTHREADS_VARGT_INDEX (QUICKTHREADS_15) +#define QUICKTHREADS_VSTARTUP_INDEX (QUICKTHREADS_16) +#define QUICKTHREADS_VUSERF_INDEX (QUICKTHREADS_17) +#define QUICKTHREADS_VCLEANUP_INDEX (QUICKTHREADS_18) + +#endif /* ndef QUICKTHREADS_PA_RISC_H */ diff --git a/ext/systemc/src/sysc/qt/md/hppa.s b/ext/systemc/src/sysc/qt/md/hppa.s new file mode 100644 index 000000000..84d8e875b --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/hppa.s @@ -0,0 +1,237 @@ +; pa-risc.s -- assembly support. + +; QuickThreads -- Threads-building toolkit. +; Copyright (c) 1993 by David Keppel +; +; Permission to use, copy, modify and distribute this software and +; its documentation for any purpose and without fee is hereby +; granted, provided that the above copyright notice and this notice +; appear in all copies. This software is provided as a +; proof-of-concept and for demonstration purposes; there is no +; representation about the suitability of this software for any +; purpose. + +; This file (pa-risc.s) is part of the port of QuickThreads for +; PA-RISC 1.1 architecture. This file implements context switches +; and thread startup. It was written in 1994 by Uwe Reder +; (`uereder@cip.informatik.uni-erlangen.de') for the Operating +; Systems Department (IMMD4) at the University of Erlangen/Nuernberg +; Germany. + + +; Callee saves general registers gr3..gr18, +; floating-point registers fr12..fr21. + + .CODE + + .IMPORT $$dyncall, MILLICODE + .IMPORT qt_error, CODE + + .EXPORT qt_blocki, ENTRY + .EXPORT qt_block, ENTRY + .EXPORT qt_abort, ENTRY + .EXPORT qt_start, ENTRY + .EXPORT qt_vstart, ENTRY + + +; arg0: ptr to function (helper) to call once curr is suspended +; and control is on arg3's stack. +; arg1: 1'th arg to *arg0. +; arg2: 2'th arg to *arg0. +; arg3: sp of new thread. + +qt_blocki + .PROC + .CALLINFO CALLER, FRAME=0, SAVE_RP, ENTRY_GR=18 + .ENTRY + + stw %rp,-20(%sp) ; save rp to old frame-marker + + stwm %r3,128(%sp) ; save callee-saves general registers + stw %r4,-124(%sp) + stw %r5,-120(%sp) + stw %r6,-116(%sp) + stw %r7,-112(%sp) + stw %r8,-108(%sp) + stw %r9,-104(%sp) + stw %r10,-100(%sp) + stw %r11,-96(%sp) + stw %r12,-92(%sp) + stw %r13,-88(%sp) + stw %r14,-84(%sp) + stw %r15,-80(%sp) + stw %r16,-76(%sp) + stw %r17,-72(%sp) + stw %r18,-68(%sp) + +qt_abort + copy %arg0,%r22 ; helper to be called by $$dyncall + copy %sp,%arg0 ; pass current sp as arg0 to helper + copy %arg3,%sp ; set new sp + + .CALL + bl $$dyncall,%mrp ; call helper + copy %mrp,%rp + + ldw -68(%sp),%r18 ; restore general registers + ldw -72(%sp),%r17 + ldw -76(%sp),%r16 + ldw -80(%sp),%r15 + ldw -84(%sp),%r14 + ldw -88(%sp),%r13 + ldw -92(%sp),%r12 + ldw -96(%sp),%r11 + ldw -100(%sp),%r10 + ldw -104(%sp),%r9 + ldw -108(%sp),%r8 + ldw -112(%sp),%r7 + ldw -116(%sp),%r6 + ldw -120(%sp),%r5 + ldw -124(%sp),%r4 + + ldw -148(%sp),%rp ; restore return-pointer + + bv %r0(%rp) ; return to caller + ldwm -128(%sp),%r3 + + .EXIT + .PROCEND + + +qt_block + .PROC + .CALLINFO CALLER, FRAME=0, SAVE_RP, ENTRY_FR=21 + .ENTRY + + stw %rp,-20(%sp) ; save rp to old frame-marker + + fstds,ma %fr12,8(%sp) ; save callee-saves float registers + fstds,ma %fr13,8(%sp) + fstds,ma %fr14,8(%sp) + fstds,ma %fr15,8(%sp) + fstds,ma %fr16,8(%sp) + fstds,ma %fr17,8(%sp) + fstds,ma %fr18,8(%sp) + fstds,ma %fr19,8(%sp) + fstds,ma %fr20,8(%sp) + fstds,ma %fr21,8(%sp) + + .CALL + bl qt_blocki,%rp + ldo 48(%sp),%sp + + ldo -48(%sp),%sp + + fldds,mb -8(%sp),%fr21 ; restore callee-saves float registers + fldds,mb -8(%sp),%fr20 + fldds,mb -8(%sp),%fr19 + fldds,mb -8(%sp),%fr18 + fldds,mb -8(%sp),%fr17 + fldds,mb -8(%sp),%fr16 + fldds,mb -8(%sp),%fr15 + fldds,mb -8(%sp),%fr14 + fldds,mb -8(%sp),%fr13 + + ldw -28(%sp),%rp ; restore return-pointer + + bv %r0(%rp) ; return to caller. + fldds,mb -8(%sp),%fr12 + + .EXIT + .PROCEND + + +qt_start + .PROC + .CALLINFO CALLER, FRAME=0 + .ENTRY + + copy %r18,%arg0 ; set user arg `pu'. + copy %r17,%arg1 ; ... user function pt. + copy %r16,%arg2 ; ... user function userf. + ; %r22 is a caller-saves register + copy %r15,%r22 ; function to be called by $$dyncall + + .CALL ; in=%r22 + bl $$dyncall,%mrp ; call `only'. + copy %mrp,%rp + + bl,n qt_error,%r0 ; `only' erroniously returned. + + .EXIT + .PROCEND + + +; Varargs +; +; First, call `startup' with the `pt' argument. +; +; Next, call the user's function with all arguments. +; We don't know whether arguments are integers, 32-bit floating-points or +; even 64-bit floating-points, so we reload all the registers, possibly +; with garbage arguments. The thread creator provided non-garbage for +; the arguments that the callee actually uses, so the callee never gets +; garbage. +; +; -48 -44 -40 -36 -32 +; | arg3 | arg2 | arg1 | arg0 | +; ----------------------------- +; integers: arg3 arg2 arg1 arg0 +; 32-bit fps: farg3 farg2 farg1 farg0 +; 64-bit fps: <---farg3--> <---farg1--> +; +; Finally, call `cleanup' with the `pt' argument and with the return value +; from the user's function. It is an error for `cleanup' to return. + +qt_vstart + .PROC + .CALLINFO CALLER, FRAME=0 + .ENTRY + + ; Because the startup function may damage the fixed arguments + ; on the stack (PA-RISC Procedure Calling Conventions Reference + ; Manual, 2.4 Fixed Arguments Area), we allocate a seperate + ; stack frame for it. + ldo 64(%sp),%sp + + ; call: void startup(void *pt) + + copy %r15,%arg0 ; `pt' is arg0 to `startup'. + copy %r16,%r22 + .CALL + bl $$dyncall,%mrp ; Call `startup'. + copy %mrp,%rp + + ldo -64(%sp),%sp + + ; call: void *qt_vuserf_t(...) + + ldw -36(%sp),%arg0 ; Load args to integer registers. + ldw -40(%sp),%arg1 + ldw -44(%sp),%arg2 + ldw -48(%sp),%arg3 + ; Index of fld[w|d]s only ranges from -16 to 15, so we + ; take r22 to be our new base register. + ldo -32(%sp),%r22 + fldws -4(%r22),%farg0 ; Load args to floating-point registers. + fldds -8(%r22),%farg1 + fldws -12(%r22),%farg2 + fldds -16(%r22),%farg3 + copy %r17,%r22 + .CALL + bl $$dyncall,%mrp ; Call `userf'. + copy %mrp,%rp + + ; call: void cleanup(void *pt, void *vuserf_return) + + copy %r15,%arg0 ; `pt' is arg0 to `cleanup'. + copy %ret0,%arg1 ; Return-value is arg1 to `cleanup'. + copy %r18,%r22 + .CALL + bl $$dyncall,%mrp ; Call `cleanup'. + copy %mrp,%rp + + bl,n qt_error,%r0 + + .EXIT + .PROCEND diff --git a/ext/systemc/src/sysc/qt/md/hppa_b.s b/ext/systemc/src/sysc/qt/md/hppa_b.s new file mode 100644 index 000000000..1b1e8264e --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/hppa_b.s @@ -0,0 +1,203 @@ +; QuickThreads -- Threads-building toolkit. +; Copyright (c) 1993 by David Keppel + +; Permission to use, copy, modify and distribute this software and +; its documentation for any purpose and without fee is hereby +; granted, provided that the above copyright notice and this notice +; appear in all copies. This software is provided as a +; proof-of-concept and for demonstration purposes; there is no +; representation about the suitability of this software for any +; purpose. + +; This file (pa-risc_b.s) is part of the port of QuickThreads for +; PA-RISC 1.1 architecture. It contains assembly-level support for +; raw processor performance measurement. It was written in 1994 by +; Uwe Reder (`uereder@cip.informatik.uni-erlangen.de') +; for the Operating Systems Department (IMMD4) at the +; University of Erlangen/Nuernberg Germany. + + +; Note that the number of instructions in the measurement-loops, differ +; from implementation to implementation. I took eight instructions in a loop +; for every test (execute eight instructions and loop to the start). + + .CODE + + .IMPORT $global$,DATA + .IMPORT $$dyncall,MILLICODE + .EXPORT b_call_reg + .EXPORT b_call_imm + .EXPORT b_add + .EXPORT b_load + +; Just do nothing, only return to caller. This procedure is called by +; `b_call_reg' and `b_call_imm'. + +b_null + .PROC + .CALLINFO NO_CALLS, FRAME=0 + .ENTRY + + bv,n %r0(%rp) ; just return + + .EXIT + .PROCEND + +; Call the procedure `b_null' with function pointer in a register. + +b_call_reg + .PROC + .CALLINFO CALLER, FRAME=0 + .ENTRY + + stwm %r3,64(%sp) ; store r3 (may be used by caller) + stw %rp,-20(%sp) ; save return-pointer to frame-marker + + addil LR'to_call-$global$,%r27 + ldw RR'to_call-$global$(%r1),%r3 + +_loop0 + copy %r3,%r22 ; copy the procedure label to r22, ... + .CALL ; ...this is the input to $$dyncall + bl $$dyncall,%mrp ; call $$dyncall (millicode function) + copy %mrp,%rp ; remember the return-pointer + + copy %r3,%r22 + .CALL + bl $$dyncall,%mrp + copy %mrp,%rp + + copy %r3,%r22 + .CALL + bl $$dyncall,%mrp + copy %mrp,%rp + + copy %r3,%r22 + .CALL + bl $$dyncall,%mrp + copy %mrp,%rp + + copy %r3,%r22 + .CALL + bl $$dyncall,%mrp + copy %mrp,%rp + + copy %r3,%r22 + .CALL + bl $$dyncall,%mrp + copy %mrp,%rp + + copy %r3,%r22 + .CALL + bl $$dyncall,%mrp + copy %mrp,%rp + + copy %r3,%r22 + .CALL + bl $$dyncall,%mrp + copy %mrp,%rp + + addibf,<= -8,%arg0,_loop0 ; decrement counter by 8 and loop + nop + + ldw -20(%sp),%rp ; restore return-pointer + bv %r0(%rp) ; return to caller + ldwm -64(%sp),%r3 ; resore r3 and remove stack frame + + .EXIT + .PROCEND + +; Call the procedure `b_null' immediate. + +b_call_imm + .PROC + .CALLINFO CALLER, FRAME=0, SAVE_RP + .ENTRY + + ldo 64(%sp),%sp ; caller needs a stack-frame + stw %rp,-20(%sp) ; save return-pointer to frame-marker + +_loop1 + bl b_null,%rp ; call `b_null' immediate (8 times) + nop + bl b_null,%rp + nop + bl b_null,%rp + nop + bl b_null,%rp + nop + bl b_null,%rp + nop + bl b_null,%rp + nop + bl b_null,%rp + nop + bl b_null,%rp + nop + + addibf,<= -8,%arg0,_loop1 ; decrement counter by 8 and loop + nop + + ldw -20(%sp),%rp ; restore return-pointer + bv %r0(%rp) ; return to caller + ldo -64(%sp),%sp ; remove stack-frame + + .EXIT + .PROCEND + +; Copy register-to-register. +; On PA-RISC this is implemented with an `or'. +; The `or' is hidden by a pseudo-operation called `copy'. + +b_add + .PROC + .CALLINFO NO_CALLS, FRAME=0 + .ENTRY + +_loop2 + copy %r19,%r20 ; copy register-to-register + copy %r20,%r21 ; use caller-saves registers + copy %r21,%r22 + copy %r22,%r21 + copy %r21,%r20 + copy %r20,%r19 + copy %r19,%r20 + copy %r20,%r21 + + addibf,<= -8,%arg0,_loop2 ; decrement counter by 8 and loop + nop + + bv,n %r0(%rp) + + .EXIT + .PROCEND + +; Load memory to a register. + +b_load + .PROC + .CALLINFO NO_CALLS, FRAME=0 + .ENTRY + +_loop3 + ldw -4(%sp),%r22 ; load data from frame-marker + ldw -8(%sp),%r22 ; use a caller-saves register + ldw -12(%sp),%r22 + ldw -16(%sp),%r22 + ldw -20(%sp),%r22 + ldw -24(%sp),%r22 + ldw -28(%sp),%r22 + ldw -32(%sp),%r22 + + addibf,<= -8,%arg0,_loop3 ; decrement counter by 8 and loop + nop + + bv,n %r0(%rp) + + .EXIT + .PROCEND + + + .ALIGN 8 +to_call + .WORD b_null diff --git a/ext/systemc/src/sysc/qt/md/i386.README b/ext/systemc/src/sysc/qt/md/i386.README new file mode 100644 index 000000000..8ffb92198 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/i386.README @@ -0,0 +1,7 @@ +Note that some machines want labels to have leading underscores, +while others (e.g. System V) do not. Thus, several labels appear +duplicated except for the leading underscore, e.g. + + _qt_cswap: + qt_cswap: + diff --git a/ext/systemc/src/sysc/qt/md/i386.h b/ext/systemc/src/sysc/qt/md/i386.h new file mode 100644 index 000000000..04513857e --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/i386.h @@ -0,0 +1,132 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#ifndef QUICKTHREADS_386_H +#define QUICKTHREADS_386_H + +typedef unsigned long qt_word_t; + +/* Thread's initial stack layout on the i386: + + non-varargs: + + +--- + | arg[2] === `userf' on startup + | arg[1] === `pt' on startup + | arg[0] === `pu' on startup + +--- + | ret pc === qt_error + +--- + | ret pc === `only' on startup + +--- + | %ebp + | %esi + | %edi + | %ebx <--- qt_t.sp + +--- + + When a non-varargs thread is started, it ``returns'' directly to + the client's `only' function. + + varargs: + + +--- + | arg[n-1] + | .. + | arg[0] + +--- + | ret pc === `qt_vstart' + +--- + | %ebp === `startup' + | %esi === `cleanup' + | %edi === `pt' + | %ebx === `vuserf' <--- qt_t.sp + +--- + + When a varargs thread is started, it ``returns'' to the `qt_vstart' + startup code. The startup code calls the appropriate functions. */ + + +/* What to do to start a varargs thread running. */ +extern void qt_vstart (void); + + +/* Hold 4 saved regs plus two return pcs (qt_error, qt_start) plus + three args. */ +#define QUICKTHREADS_STKBASE (13 * 4) + +/* Hold 4 saved regs plus one return pc (qt_vstart). */ +#define QUICKTHREADS_VSTKBASE (5 * 4) + + +/* Stack must be 16-byte aligned at function call instr. (SSE data support) */ +#define QUICKTHREADS_STKALIGN (16) + + +/* Where to place various arguments. */ +#define QUICKTHREADS_ONLY_INDEX (QUICKTHREADS_PC) +#define QUICKTHREADS_USER_INDEX (QUICKTHREADS_ARG2) +#define QUICKTHREADS_ARGT_INDEX (QUICKTHREADS_ARG1) +#define QUICKTHREADS_ARGU_INDEX (QUICKTHREADS_ARG0) + +#define QUICKTHREADS_VSTARTUP_INDEX (QUICKTHREADS_EBP) +#define QUICKTHREADS_VUSERF_INDEX (QUICKTHREADS_EBX) +#define QUICKTHREADS_VCLEANUP_INDEX (QUICKTHREADS_ESI) +#define QUICKTHREADS_VARGT_INDEX (QUICKTHREADS_EDI) + + +#define QUICKTHREADS_EBX 0 +#define QUICKTHREADS_EDI 1 +#define QUICKTHREADS_ESI 2 +#define QUICKTHREADS_EBP 3 +#define QUICKTHREADS_POP0 4 +#define QUICKTHREADS_POP1 5 +#define QUICKTHREADS_POP2 6 +#define QUICKTHREADS_PC 7 +/* The following are defined only for non-varargs. */ +#define QUICKTHREADS_POPE 8 +#define QUICKTHREADS_ARG0 9 +#define QUICKTHREADS_ARG1 10 +#define QUICKTHREADS_ARG2 11 +#define QUICKTHREADS_RPC 12 + + +/* Stack grows down. The top of the stack is the first thing to + pop off (preincrement, postdecrement). */ +#define QUICKTHREADS_GROW_DOWN + +extern void qt_error (void); + +/* For correct 16-byte stack alignment (auto-relocatable functions) */ +extern void qt_tramp (void); +extern void qt_align (void); + +/* Push on the error return address and the alignment/trampoline functions. */ +#define QUICKTHREADS_ARGS_MD(sto) \ + (QUICKTHREADS_SPUT (sto, QUICKTHREADS_POP0, qt_align), \ + QUICKTHREADS_SPUT (sto, QUICKTHREADS_POP1, qt_align), \ + QUICKTHREADS_SPUT (sto, QUICKTHREADS_POP2, qt_align), \ + QUICKTHREADS_SPUT (sto, QUICKTHREADS_POPE, qt_tramp), \ + QUICKTHREADS_SPUT (sto, QUICKTHREADS_RPC, qt_error)) + + +/* When varargs are pushed, allocate space for all the args. */ +#define QUICKTHREADS_VARGS_MD0(sto, nbytes) \ + ((qt_t *)(((char *)(sto)) - QUICKTHREADS_STKROUNDUP(nbytes))) + +#define QUICKTHREADS_VARGS_MD1(sto) \ + (QUICKTHREADS_SPUT (sto, QUICKTHREADS_PC, qt_vstart)) + +#define QUICKTHREADS_VARGS_DEFAULT + +#endif /* QUICKTHREADS_386_H */ diff --git a/ext/systemc/src/sysc/qt/md/i386.s b/ext/systemc/src/sysc/qt/md/i386.s new file mode 100644 index 000000000..b5806cd27 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/i386.s @@ -0,0 +1,119 @@ +/* i386.s -- assembly support. */ + +/* +// QuickThreads -- Threads-building toolkit. +// Copyright (c) 1993 by David Keppel +// +// Permission to use, copy, modify and distribute this software and +// its documentation for any purpose and without fee is hereby +// granted, provided that the above copyright notice and this notice +// appear in all copies. This software is provided as a +// proof-of-concept and for demonstration purposes; there is no +// representation about the suitability of this software for any +// purpose. */ + +/* NOTE: double-labeled `_name' and `name' for System V compatability. */ +/* NOTE: Mixed C/C++-style comments used. Sorry! */ + +/* Callee-save: %esi, %edi, %ebx, %ebp +// Caller-save: %eax, %ecx +// Can't tell: %edx (seems to work w/o saving it.) +// +// Assignment: +// +// See ``i386.h'' for the somewhat unconventional stack layout. */ + + + .text + .align 2 + + .globl _qt_abort + .globl qt_abort + .globl _qt_block + .globl qt_block + .globl _qt_blocki + .globl qt_blocki + .globl _qt_align + .globl qt_align + +/* These all have the type signature +// +// void *blocking (helper, arg0, arg1, new) +// +// On procedure entry, the helper is at 4(sp), args at 8(sp) and +// 12(sp) and the new thread's sp at 16(sp). It *appears* that the +// calling convention for the 8X86 requires the caller to save all +// floating-point registers, this makes our life easy. */ + +/* Halt the currently-running thread. Save it's callee-save regs on +// to the stack, 32 bytes. Switch to the new stack (next == 16+32(sp)) +// and call the user function (f == 4+32(sp) with arguments: old sp +// arg1 (8+32(sp)) and arg2 (12+32(sp)). When the user function is +// done, restore the new thread's state and return. +// +// `qt_abort' is (currently) an alias for `qt_block' because most of +// the work is shared. We could save the insns up to `qt_common' by +// replicating, but w/o replicating we need an inital subtract (to +// offset the stack as if it had been a qt_block) and then a jump +// to qt_common. For the cost of a jump, we might as well just do +// all the work. +// +// The helper function (4(sp)) can return a void* that is returned +// by the call to `qt_blockk{,i}'. Since we don't touch %eax in +// between, we get that ``for free''. */ + +_qt_abort: +qt_abort: +_qt_block: +qt_block: +_qt_blocki: +qt_blocki: + pushl %ebp /* Save callee-save, sp-=4. */ + pushl %esi /* Save callee-save, sp-=4. */ + pushl %edi /* Save callee-save, sp-=4. */ + pushl %ebx /* Save callee-save, sp-=4. */ + movl %esp, %eax /* Remember old stack pointer. */ + +qt_common: + movl 32(%esp), %esp /* Move to new thread. */ + pushl 28(%eax) /* Push arg 2. */ + pushl 24(%eax) /* Push arg 1. */ + pushl %eax /* Push arg 0. */ + movl 20(%eax), %ebx /* Get function to call. */ + call *%ebx /* Call f. */ + addl $12, %esp /* Pop args. */ + + popl %ebx /* Restore callee-save, sp+=4. */ + popl %edi /* Restore callee-save, sp+=4. */ + popl %esi /* Restore callee-save, sp+=4. */ + popl %ebp /* Restore callee-save, sp+=4. */ +_qt_align: +qt_align: + ret /* Resume the stopped function. */ + + .globl _qt_tramp + .globl qt_tramp +_qt_tramp: +qt_tramp: + movl 12(%esp), %eax /* Load 'qt_error' address */ + sub $4, %esp /* Align stack pointer to 16-byte boundary */ + jmp *%eax /* call 'qt_error' */ + hlt /* 'qt_error' never returns */ + +/* Start a varargs thread. */ + + .globl _qt_vstart + .globl qt_vstart +_qt_vstart: +qt_vstart: + pushl %edi /* Push `pt' arg to `startup'. */ + call *%ebp /* Call `startup'. */ + popl %eax /* Clean up the stack. */ + + call *%ebx /* Call the user's function. */ + + pushl %eax /* Push return from user's. */ + pushl %edi /* Push `pt' arg to `cleanup'. */ + call *%esi /* Call `cleanup'. */ + + hlt /* `cleanup' never returns. */ diff --git a/ext/systemc/src/sysc/qt/md/i386_b.s b/ext/systemc/src/sysc/qt/md/i386_b.s new file mode 100644 index 000000000..32129a5d1 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/i386_b.s @@ -0,0 +1,30 @@ +/* +// QuickThreads -- Threads-building toolkit. +// Copyright (c) 1993 by David Keppel +// +// Permission to use, copy, modify and distribute this software and +// its documentation for any purpose and without fee is hereby +// granted, provided that the above copyright notice and this notice +// appear in all copies. This software is provided as a +// proof-of-concept and for demonstration purposes; there is no +// representation about the suitability of this software for any +// purpose. */ + + .globl _b_call_reg + .globl b_call_reg + .globl _b_call_imm + .globl b_call_imm + .globl _b_add + .globl b_add + .globl _b_load + .globl b_load + +_b_call_reg: +b_call_reg: +_b_call_imm: +b_call_imm: +_b_add: +b_add: +_b_load: +b_load: + hlt diff --git a/ext/systemc/src/sysc/qt/md/iX86_64.h b/ext/systemc/src/sysc/qt/md/iX86_64.h new file mode 100644 index 000000000..97bfe39b4 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/iX86_64.h @@ -0,0 +1,140 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#ifndef QUICKTHREADS_X86_64_H +#define QUICKTHREADS_X86_64_H + +typedef unsigned long qt_word_t; + +/* Thread's initial stack layout on the iX86_64: + + non-varargs: + + +--- + | arg[2] === `userf' on startup + | arg[1] === `pt' on startup + | arg[0] === `pu' on startup + +--- + | ret pc === qt_error + +--- + | ret pc === `only' on startup + +--- + | %ebp + | %esi + | %edi + | %ebx <--- qt_t.sp + +--- + + When a non-varargs thread is started, it ``returns'' directly to + the client's `only' function. + + varargs: + + +--- + | arg[n-1] + | .. + | arg[0] + +--- + | ret pc === `qt_vstart' + +--- + | %ebp === `startup' + | %esi === `cleanup' + | %edi === `pt' + | %ebx === `vuserf' <--- qt_t.sp + +--- + + When a varargs thread is started, it ``returns'' to the `qt_vstart' + startup code. The startup code calls the appropriate functions. */ + + +/* What to do to start a varargs thread running. */ +extern void qt_vstart (void); + + +/* Hold four return pcs (qt_error, qt_start and twice qt_align) + plus ten args and two qt_word_t's for correct alignment. */ +#define QUICKTHREADS_STKBASE (16 * sizeof(long)) + +/* Hold 4 saved regs plus one return pc (qt_vstart). */ +#define QUICKTHREADS_VSTKBASE (5 * sizeof(long)) + + +/* Stack must be 16-byte aligned at function call instr. (SSE data support) */ +#define QUICKTHREADS_STKALIGN (16) + + +/* Where to place various arguments. */ +#define QUICKTHREADS_ONLY_INDEX (QUICKTHREADS_PC) +#define QUICKTHREADS_USER_INDEX (QUICKTHREADS_ARG2) +#define QUICKTHREADS_ARGT_INDEX (QUICKTHREADS_ARG1) +#define QUICKTHREADS_ARGU_INDEX (QUICKTHREADS_ARG0) + +#define QUICKTHREADS_VSTARTUP_INDEX (QUICKTHREADS_EBP) +#define QUICKTHREADS_VUSERF_INDEX (QUICKTHREADS_EBX) +#define QUICKTHREADS_VCLEANUP_INDEX (QUICKTHREADS_ESI) +#define QUICKTHREADS_VARGT_INDEX (QUICKTHREADS_EDI) + + +/* Stack layout offsets relative to stack at initial stack setup. */ + +/* Stack alignment 15 */ +#define QUICKTHREADS_RPC 14 +#define QUICKTHREADS_POP0 13 +#define QUICKTHREADS_PC 12 +#define QUICKTHREADS_POP1 11 +#define QUICKTHREADS_RBP 10 +/* Stack alignment 9 */ +#define QUICKTHREADS_R12 8 +#define QUICKTHREADS_R13 7 +#define QUICKTHREADS_R14 6 +#define QUICKTHREADS_R15 5 +#define QUICKTHREADS_RBX 4 +#define QUICKTHREADS_RCX 3 +#define QUICKTHREADS_RDX 2 +#define QUICKTHREADS_RDI 1 +#define QUICKTHREADS_RSI 0 + + +/* Arguments to save stack function. */ + +#define QUICKTHREADS_ARG0 QUICKTHREADS_RDI +#define QUICKTHREADS_ARG1 QUICKTHREADS_RSI +#define QUICKTHREADS_ARG2 QUICKTHREADS_RDX + + +/* Stack grows down. The top of the stack is the first thing to + pop off (preincrement, postdecrement). */ +#define QUICKTHREADS_GROW_DOWN + +extern void qt_error (void); +extern void qt_align (void); /* For correct stack alignment */ + +/* Push on the error return address, force Frame Pointer to 0 and + push stack alignment trampoline function. */ +#define QUICKTHREADS_ARGS_MD(sto) \ + (QUICKTHREADS_SPUT (sto, QUICKTHREADS_RBP, 0), \ + QUICKTHREADS_SPUT (sto, QUICKTHREADS_POP0, qt_align), \ + QUICKTHREADS_SPUT (sto, QUICKTHREADS_POP1, qt_align), \ + QUICKTHREADS_SPUT (sto, QUICKTHREADS_RPC, qt_error)) + + +/* When varargs are pushed, allocate space for all the args. */ +#define QUICKTHREADS_VARGS_MD0(sto, nbytes) \ + ((qt_t *)(((char *)(sto)) - QUICKTHREADS_STKROUNDUP(nbytes))) + +#define QUICKTHREADS_VARGS_MD1(sto) \ + (QUICKTHREADS_SPUT (sto, QUICKTHREADS_PC, qt_vstart)) + +#define QUICKTHREADS_VARGS_DEFAULT + +#endif /* QUICKTHREADS_X86_64_H */ diff --git a/ext/systemc/src/sysc/qt/md/iX86_64.s b/ext/systemc/src/sysc/qt/md/iX86_64.s new file mode 100644 index 000000000..a8bcfcd96 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/iX86_64.s @@ -0,0 +1,74 @@ +/* iX386_64.s -- assembly support. */ + +/* +// QuickThreads -- Threads-building toolkit. +// Copyright (c) 1993 by David Keppel +// +// Permission to use, copy, modify and distribute this software and +// its documentation for any purpose and without fee is hereby +// granted, provided that the above copyright notice and this notice +// appear in all copies. This software is provided as a +// proof-of-concept and for demonstration purposes; there is no +// representation about the suitability of this software for any +// purpose. */ + +/* 64-bit Intel Architecture Support +// written by Andy Goodrich, Forte Design Systms, Inc. */ + +/* NOTE: double-labeled `_name' and `name' for System V compatability. */ +/* NOTE: Mixed C/C++-style comments used. Sorry! */ + + .text + .align 2 + + .globl _qt_abort + .globl qt_abort + .globl _qt_block + .globl qt_block + .globl _qt_blocki + .globl qt_blocki + .globl _qt_align + .globl qt_align + +_qt_abort: +qt_abort: +_qt_block: +qt_block: +_qt_blocki: +qt_blocki: + /* 11 (return address.) */ + pushq %rbp /* 10 (push stack frame top.) */ + movq %rsp, %rbp /* set new stack frame top. */ + /* save registers. */ + subq $8, %rsp /* 9 (Stack alignment) */ + pushq %r12 /* 8 ... */ + pushq %r13 /* 7 ... */ + pushq %r14 /* 6 ... */ + pushq %r15 /* 5 ... */ + pushq %rbx /* 4 ... */ + pushq %rcx /* 3 ... (new stack address) */ + pushq %rdx /* 2 ... (arg) */ + pushq %rdi /* 1 ... (address of save function.) */ + pushq %rsi /* 0 ... (cor) */ + + movq %rdi, %rax /* get address of save function. */ + movq %rsp, %rdi /* set current stack as save argument. */ + movq %rcx, %rsp /* swap stacks. */ + movq %rcx, %rbp /* adjust stack frame pointer. */ + addq $10*8, %rbp /* ... */ + call *%rax /* call function to save stack pointer. */ + + /* restore registers. */ + popq %rsi /* ... */ + popq %rdi /* ... */ + popq %rdx /* ... */ + popq %rcx /* ... */ + popq %rbx /* ... */ + popq %r15 /* restore registers from new stack. */ + popq %r14 /* ... */ + popq %r13 /* ... */ + popq %r12 /* ... */ + leave /* unwind stack. */ +_qt_align: +qt_align: + ret /* return. */ diff --git a/ext/systemc/src/sysc/qt/md/ksr1.Makefile b/ext/systemc/src/sysc/qt/md/ksr1.Makefile new file mode 100644 index 000000000..aa195839a --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/ksr1.Makefile @@ -0,0 +1,6 @@ + +# +# KSR1 configuration. +# +CC = cc -ansi + diff --git a/ext/systemc/src/sysc/qt/md/ksr1.h b/ext/systemc/src/sysc/qt/md/ksr1.h new file mode 100644 index 000000000..b3877505d --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/ksr1.h @@ -0,0 +1,164 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#ifndef QUICKTHREADS_KSR1_H +#define QUICKTHREADS_KSR1_H + +/* + Stack layout: + + Registers are saved in strictly low to high order, FPU regs first + (only if qt_block is called), CEU regs second, IPU regs next, with no + padding between the groups. + + Callee-save: f16..f63; c15..c30; i12..i30. + Args passed in i2..i5. + + Note: c31 is a private data pointer. It is not changed on thread + swaps with the assumption that it represents per-processor rather + than per-thread state. + + Note: i31 is an instruction count register that is updated by the + context switch routines. Like c31, it is not changed on context + switches. + + This is what we want on startup: + + + +------ <-- BOS: Bottom of stack (grows down) + | 80 (128 - 48) bytes of padding to a 128-byte boundary + +--- + | only + | userf + | t + | u + | qt_start$TXT + | (empty) <-- qt.sp + +------ <-- (BOS - 128) + + This is why we want this on startup: + + A thread begins running when the restore procedure switches thread stacks + and pops a return address off of the top of the new stack (see below + for the reason why we explicitly store qt_start$TXT). The + block procedure pushes two jump addresses on a thread's stack before + it switches stacks. The first is the return address for the block + procedure, and the second is a restore address. The return address + is used to jump back to the thread that has been switched to; the + restore address is a jump within the block code to restore the registers. + Normally, this is just a jump to the next address. However, on thread + startup, this is a jump to qt_start$TXT. (The block procedure stores + the restore address at an offset of 8 bytes from the top of the stack, + which is also the offset at which qt_start$TXT is stored on the stacks + of new threads. Hence, when the block procedure switches to a new + thread stack, it will initially jump to qt_start$TXT; thereafter, + it jumps to the restore code.) + + qt_start$TXT, after it has read the initial data on the new thread's + stack and placed it in registers, pops the initial stack frame + and gives the thread the entire stack to use for execution. + + The KSR runtime system has an unusual treatment of pointers to + functions. From C, taking the `name' of a function yields a + pointer to a _constant block_ and *not* the address of the + function. The zero'th entry in the constant block is a pointer to + the function. + + We have to be careful: the restore procedure expects a return + address on the top of the stack (pointed to by qt.sp). This is not + a problem when restoring a thread that has run before, since the + block routine would have stored the return address on top of the + stack. However, when ``faking up'' a thread start (bootstrapping a + thread stack frame), the top of the stack needs to contain a + pointer to the code that will start the thread running. + + The pointer to the startup code is *not* `qt_start'. It is the + word *pointed to* by `qt_start'. Thus, we dereference `qt_start', + see QUICKTHREADS_ARGS_MD below. + + On varargs startup (still unimplemented): + + | padding to 128 byte boundary + | varargs <-- padded to a 128-byte-boundary + +--- + | caller's frame, 16 bytes + | 80 bytes of padding (frame padded to a 128-byte boundary) + +--- + | cleanup + | vuserf + | startup + | t + +--- + | qt_start <-- qt.sp + +--- + + Of a suspended thread: + + +--- + | caller's frame, 16 bytes + | fpu registers 47 regs * 8 bytes/reg 376 bytes + | ceu registers 16 regs * 8 bytes/reg 128 bytes + | ipu registers 19 regs * 8 bytes/reg 152 bytes + | : + | 80 bytes of padding + | : + | qt_restore <-- qt.sp + +--- + + */ + + +#define QUICKTHREADS_STKALIGN 128 +#define QUICKTHREADS_GROW_DOWN +typedef unsigned long qt_word_t; + +#define QUICKTHREADS_STKBASE QUICKTHREADS_STKALIGN +#define QUICKTHREADS_VSTKBASE QUICKTHREADS_STKBASE + +extern void qt_start(void); +/* + * See the discussion above for what indexing into a procedure ptr + * does for us (it's lovely, though, isn't it?). + * + * This assumes that the address of a procedure's code is the + * first word in a procedure's constant block. That's how the manual + * says it will be arranged. + */ +#define QUICKTHREADS_ARGS_MD(sp) (QUICKTHREADS_SPUT (sp, 1, ((qt_word_t *)qt_start)[0])) + +/* + * The *index* (positive offset) of where to put each value. + * See the picture of the stack above that explains the offsets. + */ +#define QUICKTHREADS_ONLY_INDEX (5) +#define QUICKTHREADS_USER_INDEX (4) +#define QUICKTHREADS_ARGT_INDEX (3) +#define QUICKTHREADS_ARGU_INDEX (2) + +#define QUICKTHREADS_VARGS_DEFAULT +#define QUICKTHREADS_VARGS(sp, nb, vargs, pt, startup, vuserf, cleanup) \ + (qt_vargs (sp, nbytes, &vargs, pt, startup, vuserf, cleanup)) + + +#define QUICKTHREADS_VARGS_MD0(sp, vabytes) \ + ((qt_t *)(((char *)(sp)) - 4*8 - QUICKTHREADS_STKROUNDUP(vabytes))) + +extern void qt_vstart(void); +#define QUICKTHREADS_VARGS_MD1(sp) (QUICKTHREADS_SPUT (sp, 0, ((qt_word_t *)qt_vstart)[0])) + +#define QUICKTHREADS_VCLEANUP_INDEX (4) +#define QUICKTHREADS_VUSERF_INDEX (3) +#define QUICKTHREADS_VSTARTUP_INDEX (2) +#define QUICKTHREADS_VARGT_INDEX (1) + +#endif /* def QUICKTHREADS_KSR1_H */ diff --git a/ext/systemc/src/sysc/qt/md/ksr1.s b/ext/systemc/src/sysc/qt/md/ksr1.s new file mode 100644 index 000000000..d4d51a0a6 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/ksr1.s @@ -0,0 +1,424 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + .file "ksr1.s" + .def .debug; .endef + + .align 128 + .globl qt_blocki + .globl qt_blocki$TXT + .globl qt_block + .globl qt_block$TXT + .globl qt_start$TXT + .globl qt_start + .globl qt_abort$TXT + .globl qt_abort + .globl qt_vstart + .globl qt_vstart$TXT + +# +# KSR convention: on procedure calls, load both the procedure address +# and a pointer to a constant block. The address of function `f' is +# `f$TXT', and the constant block address is `f'. The constant block +# has several reserved values: +# +# 8 bytes fpu register save mask +# 4 bytes ipu register save mask +# 4 bytes ceu register save mask +# f: f$TXT +# ... whatever you want ... (not quite...read on) +# +# Note, by the way, that a pointer to a function is passed as a +# pointer to the constant area, and the constant area has the text +# address. +# + +# +# Procedures that do not return structures prefix their code with +# +# proc$TXT: +# finop; cxnop +# finop; cxnop +# <proc code> +# +# Calls to those procedures branch to a 16 byte offset (4 instrs) in +# to the procedure to skip those instructions. +# +# Procedures that return structures use a different code prefix: +# +# proc$TXT: +# finop; beq.qt %rc, %rc, 24 # return value entry +# finop; cxnop +# finop; movi8 0, %rc # no return value entry +# <proc code> +# +# Calls that want the returned structure branch directly to the +# procedure address. Callers that don't want (or aren't expecting) a +# return value branche 16 bytes in to the procedure, which will zero +# %rc, telling the called procedure not to return a structure. +# + +# +# On entry: +# %i2 -- control block of helper function to run +# (dereference to get helper) +# %i3 -- a1 +# %i4 -- a2 +# %i5 -- sp of new to run +# + + .data + .half 0x0, 0x0, 0x7ffff000, 0x7fff8000 +qt_blocki: +qt_abort: + .word qt_blocki$TXT + .word qt_restore$TXT + + .text +qt_abort$TXT: +qt_blocki$TXT: + finop ; cxnop # entry prefix + finop ; cxnop # entry prefix + add8.ntr 75,%i31,%i31 ; movi8 512,%c5 # ICR; stk adjust + finop ; ssub8.ntr 0,%sp,%c5,%sp + finop ; st8 %fp,504(%sp) # Save caller's fp + finop ; st8 %cp,496(%sp) # Save caller's cp + finop ; ld8 8(%c10),%c5 # ld qt_restore$TXT + finop ; st8 %c14,0(%sp) # Save special ret addr + finop ; mov8_8 %c10, %cp # Our cp + finop ; sadd8.ntr 0,%sp,%c5,%fp # Our frame ptr + finop ; st8 %c5,8(%sp) # st qt_restore$TXT +# +# CEU registers %c15-%c24, %c26-%c30 (%c14 we restore later) +# + finop ; st8 %c15,456(%sp) + finop ; st8 %c16,448(%sp) + finop ; st8 %c17,440(%sp) + finop ; st8 %c18,432(%sp) + finop ; st8 %c19,424(%sp) + finop ; st8 %c20,416(%sp) + finop ; st8 %c21,408(%sp) + finop ; st8 %c22,400(%sp) + finop ; st8 %c23,392(%sp) + finop ; st8 %c24,384(%sp) +# +# %c25 is the Enclosing Frame Pointer (EFP) -- since C doesn't +# use nested procedures, we ignore it (leaving a gap, though) +# + finop ; st8 %c26,368(%sp) + finop ; st8 %c27,360(%sp) + finop ; st8 %c28,352(%sp) + finop ; st8 %c29,344(%sp) + finop ; st8 %c30,336(%sp) +# +# IPU registers %i12-%i30 +# + finop ; st8 %i12,328(%sp) + finop ; st8 %i13,320(%sp) + finop ; st8 %i14,312(%sp) + finop ; st8 %i15,304(%sp) +# (gap to get alignment for st64) +# -- Doesn't work on version 1.1.3 of the OS +# finop ; st64 %i16,256(%sp) + + finop ; st8 %i16,256(%sp) + finop ; st8 %i17,248(%sp) + finop ; st8 %i18,240(%sp) + finop ; st8 %i19,232(%sp) + finop ; st8 %i20,224(%sp) + finop ; st8 %i21,216(%sp) + finop ; st8 %i22,208(%sp) + finop ; st8 %i23,200(%sp) + finop ; st8 %i24,192(%sp) + finop ; st8 %i25,184(%sp) + finop ; st8 %i26,176(%sp) + finop ; st8 %i27,168(%sp) + finop ; st8 %i28,160(%sp) + finop ; st8 %i29,152(%sp) + finop ; st8 %i30,144(%sp) +# +# FPU already saved, or saving not necessary +# + +# +# Switch to the stack passed in as fourth argument to the block +# routine (%i5) and call the helper routine passed in as the first +# argument (%i2). Note that the address of the helper's constant +# block is passed in, so we must derefence it to get the helper's text +# address. +# + finop ; movb8_8 %i2,%c10 # helper's ConstBlock + finop ; cxnop # Delay slot, fill w/ + finop ; cxnop # .. 2 st8 from above + finop ; ld8 0(%c10),%c4 # load addr of helper + finop ; movb8_8 %sp, %i2 # 1st arg to helper + # is this stack; other + # args remain in regs + finop ; movb8_8 %i5,%sp # switch stacks + finop ; jsr %c14,16(%c4) # call helper + movi8 3, %i0 ; movi8 0,%c8 # nargs brain dmg + finop ; cxnop + finop ; cxnop +# +# Here is where behavior differs for threads being restored and threads +# being started. Blocked threads have a pointer to qt_restore$TXT on +# the top of their stacks; manufactured stacks have a pointer to qt_start$TXT +# on the top of their stacks. With this setup, starting threads +# skip the (unecessary) restore operations. +# +# We jump to an offset of 16 to either (1) skip past the two noop pairs +# at the start of qt_start$TXT, or (2) skip past the two noop pairs +# after qt_restore$TXT. +# + finop ; ld8 8(%sp),%c4 + finop ; cxnop + finop ; cxnop + finop ; jmp 16(%c4) +qt_restore$TXT: + finop ; cxnop + finop ; cxnop +# +# Point of Restore: +# +# The helper funtion will return here. Any result it has placed in +# a return register (most likely %i0) will not get overwritten below +# and will consequently be the return value of the blocking routine. +# + +# +# CEU registers %c15-%c24, %c26-%c30 (%c14 we restore later) +# + finop ; ld8 456(%sp),%c15 + finop ; ld8 448(%sp),%c16 + finop ; ld8 440(%sp),%c17 + finop ; ld8 432(%sp),%c18 + finop ; ld8 424(%sp),%c19 + finop ; ld8 416(%sp),%c20 + finop ; ld8 408(%sp),%c21 + finop ; ld8 400(%sp),%c22 + finop ; ld8 392(%sp),%c23 + finop ; ld8 384(%sp),%c24 +# +# %c25 is the Enclosing Frame Pointer (EFP) -- since C doesn't +# use nested procedures, we ignore it (leaving a gap, though) +# + finop ; ld8 368(%sp),%c26 + finop ; ld8 360(%sp),%c27 + finop ; ld8 352(%sp),%c28 + finop ; ld8 344(%sp),%c29 + finop ; ld8 336(%sp),%c30 +# +# IPU registers %i12-%i30 +# + finop ; ld8 328(%sp),%i12 + finop ; ld8 320(%sp),%i13 + finop ; ld8 312(%sp),%i14 + finop ; ld8 304(%sp),%i15 +# (gap to get alignment for ld64) +# -- Doesn't work on version 1.1.3 of the OS +# finop ; ld64 256(%sp),%i16 + + finop ; ld8 256(%sp),%i16 + finop ; ld8 248(%sp),%i17 + finop ; ld8 240(%sp),%i18 + finop ; ld8 232(%sp),%i19 + finop ; ld8 224(%sp),%i20 + finop ; ld8 216(%sp),%i21 + finop ; ld8 208(%sp),%i22 + finop ; ld8 200(%sp),%i23 + finop ; ld8 192(%sp),%i24 + finop ; ld8 184(%sp),%i25 + finop ; ld8 176(%sp),%i26 + finop ; ld8 168(%sp),%i27 + finop ; ld8 160(%sp),%i28 + finop ; ld8 152(%sp),%i29 + finop ; ld8 144(%sp),%i30 + +# +# FPU registers don't need to be loaded, or will be loaded by an +# enclosing scope (e.g., if this is called by qt_block). +# + +# +# Load the special registers. We don't load the stack ptr because +# the new stack is passed in as an argument, we don't load the EFP +# because we don't use it, and we load the return address specially +# off the top of the stack. +# + finop ; ld8 0(%sp),%c14 # return addr + finop ; ld8 496(%sp),%cp + finop ; ld8 504(%sp),%fp + + finop ; jmp 32(%c14) # jump back to thread + finop ; movi8 512,%c5 # stack adjust + finop ; sadd8.ntr 0,%sp,%c5,%sp + + .data + .half 0x0, 0x0, 0x7ffff000, 0x7fff8000 +qt_block: + .word qt_block$TXT + .word qt_error + .word qt_error$TXT + .word qt_blocki +# +# Handle saving and restoring the FPU regs, relying on qt_blocki +# to save and restore the remaining registers. +# + .text +qt_block$TXT: + finop ; cxnop # entry prefix + finop ; cxnop # entry prefix + + add8.ntr 29,%i31,%i31 ; movi8 512,%c5 # ICR; stk adjust + finop ; ssub8.ntr 0,%sp,%c5,%sp + finop ; st8 %fp,504(%sp) # Save caller's fp + finop ; st8 %cp,496(%sp) # Save caller's cp + finop ; st8 %c14,488(%sp) # store ret addr + finop ; sadd8.ntr 0,%sp,%c5,%fp # Our frame ptr + finop ; mov8_8 %c10, %cp # Our cp + +# +# Store 8 registers at once...destination must be a multiple of 64 +# + finop ; st64 %f16,384(%sp) + finop ; st64 %f24,320(%sp) + finop ; st64 %f32,256(%sp) + finop ; st64 %f40,192(%sp) + finop ; st64 %f48,128(%sp) + finop ; st64 %f56,64(%sp) + +# +# Call the integer blocking routine, passing the arguments passed to us +# + finop ; ld8 24(%cp), %c10 + finop ; cxnop + finop ; jsr %c14, qt_blocki$TXT + finop ; cxnop + finop ; cxnop + movi8 4,%i0 ; movi8 0,%c8 # nargs brain dmg + +# +# Load 8 registers at once...source must be a multiple of 64 +# + finop ; ld64 64(%sp),%f56 + finop ; ld64 128(%sp),%f48 + finop ; ld64 192(%sp),%f40 + finop ; ld64 256(%sp),%f32 + finop ; ld64 320(%sp),%f24 + finop ; ld64 384(%sp),%f16 + + finop ; ld8 488(%sp),%c14 + finop ; ld8 496(%sp),%cp + finop ; ld8 504(%sp),%fp + finop ; jmp 32(%c14) # jump back to thread + finop ; movi8 512,%c5 # stack adjust + finop ; sadd8.ntr 0,%sp,%c5,%sp + + + .data + .half 0x0, 0x0, 0x7ffff000, 0x7fff8000 +qt_start: + .word qt_start$TXT +# +# A new thread is set up to "appear" as if it were executing code at +# the beginning of qt_start and then it called a blocking routine +# (qt_blocki). So when a new thread starts to run, it gets unblocked +# by the code above and "returns" to `qt_start$TXT' in the +# restore step of the switch. Blocked threads jump to 16(qt_restore$TXT), +# and starting threads jump to 16(qt_start$TXT). +# + .text +qt_start$TXT: + finop ; cxnop # + finop ; cxnop # + finop ; ld8 40(%sp),%c10 # `only' constant block + finop ; ld8 32(%sp),%i4 # `userf' arg. + finop ; ld8 24(%sp),%i3 # `t' arg. + finop ; ld8 0(%c10),%c4 # `only' text location + finop ; ld8 16(%sp),%i2 # `u' arg. + finop ; cxnop + finop ; jsr %c14,16(%c4) # call `only' +# +# Pop the frame used to store the thread's initial data +# + finop ; sadd8.ntr 0,%sp,128,%sp + finop ; cxnop + movi8 2,%i0 ; movi8 0,%c8 # nargs brain dmg +# +# If we ever return, it's an error. +# + finop ; jmp qt_error$TXT + finop ; cxnop + finop ; cxnop + movi8 0,%i0 ; movi8 0,%c8 # nargs brain dmg + + +# +# This stuff is broken +# + .data + .half 0x0, 0x0, 0x7ffff000, 0x7fff8000 +qt_vstart: + .word qt_vstart$TXT + + .text +qt_vstart$TXT: + finop ; cxnop # entry prefix + finop ; cxnop # entry prefix + finop ; cxnop + finop ; cxnop + add8.ntr 11,%i31,%i31 ; movi8 512,%c5 + finop ; ssub8.ntr 0,%sp,%c5,%sp # fix stack + finop ; ld8 8(%sp),%i2 # load `t' as arg to + finop ; cxnop # `startup' + finop ; cxnop + finop ; ld8 16(%sp),%c10 # `startup' const block + finop ; cxnop + finop ; cxnop + finop ; ld8 0(%c10),%c4 # `startup' text loc. + finop ; cxnop + finop ; cxnop + finop ; jsr %c14,16(%c4) # call `startup' + finop ; cxnop + finop ; cxnop + movi8 1, %i0 ; movi8 0,%c8 # nargs brain dmg +# +# finop ; sadd 0,%sp,128,%sp # alter stack +# + finop ; ld8 8(%sp),%i2 # load `t' as arg to + finop ; ld8 8(%sp),%i2 # load `t' as arg to + finop ; ld8 8(%sp),%i2 # load `t' as arg to + finop ; ld8 8(%sp),%i2 # load `t' as arg to + + finop ; ld8 32(%sp),%c10 # `only' constant block + finop ; ld8 8(%sp),%i2 # `u' arg. + finop ; ld8 16(%sp),%i3 # `t' arg. + finop ; ld8 0(%c10),%c4 # `only' text location + finop ; ld8 24(%sp),%i4 # `userf' arg. + finop ; cxnop + finop ; jsr %c4,16(%c4) # call `only' + finop ; cxnop + finop ; cxnop +# +# If the callee ever calls `nargs', the following instruction (pair) +# will be executed. However, we don't know when we compile this code +# how many args are being passed. So we give our best guess: 0. +# + movi8 0,%i0 ; movi8 0,%c8 # nargs brain dmg +# +# If we ever return, it's an error. +# + finop ; jmp qt_error$TXT + finop ; cxnop + finop ; cxnop + movi8 0,%i0 ; movi8 0,%c8 # nargs brain dmg diff --git a/ext/systemc/src/sysc/qt/md/ksr1_b.s b/ext/systemc/src/sysc/qt/md/ksr1_b.s new file mode 100644 index 000000000..80b0c59eb --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/ksr1_b.s @@ -0,0 +1,49 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + .file "ksr1_b.s" + .def .debug; .endef + + .globl b_call_reg$TXT + .globl b_call_reg + .globl b_call_imm$TXT + .globl b_call_imm + .globl b_add$TXT + .globl b_add + .globl b_load$TXT + .globl b_load + + +b_call_reg: +b_call_imm: +b_add: +b_load: + .word b_call_reg$TXT + .word qt_error + .word qt_error$TXT + + +b_call_reg$TXT: +b_call_imm$TXT: +b_add$TXT: +b_load$TXT: + finop ; cxnop + finop ; cxnop + finop ; ld8 16(%cp),%c4 + finop ; ld8 8(%cp),%cp + finop ; cxnop + finop ; cxnop + finop ; jsr %c4,0(%c4) + finop ; cxnop + finop ; cxnop + diff --git a/ext/systemc/src/sysc/qt/md/m88k.Makefile b/ext/systemc/src/sysc/qt/md/m88k.Makefile new file mode 100644 index 000000000..608c70690 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/m88k.Makefile @@ -0,0 +1,6 @@ + +# +# Hosted compilers for 88k for Meerkat. +# +CC = gcc88 -Dm88k -ansi -pedantic -Wall -fno-builtin +AS = as88 diff --git a/ext/systemc/src/sysc/qt/md/m88k.c b/ext/systemc/src/sysc/qt/md/m88k.c new file mode 100644 index 000000000..f2cef00a0 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/m88k.c @@ -0,0 +1,111 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#include <stdarg.h> +#include "qt.h" + +/* Varargs is harder on the m88k. Parameters are saved on the stack as + something like (stack grows down to low memory; low at bottom of + picture): + + | : + | arg8 <-- va_list.__va_stk + +--- + | : + +--- + | arg7 + | : + | iarg0 <-- va_list.__va_reg + +--- + | : + | va_list { __va_arg, __va_stk, __va_reg } + | : + +--- + + Here, `va_list.__va_arg' is the number of word-size arguments + that have already been skipped. Doubles must be double-arligned. + + What this means for us is that the user's routine needs to be + called with an arg list where some of the words in the `__va_stk' + part of the parameter list have to be promoted to registers. + + BUG: doubleword register arguments must be double-aligned. If + something is passed as an even # arg and used as an odd # arg or + vice-versa, the code in the called routine (in the new thread) that + decides how to adjust the index will get it wrong, because it will + be expect it to be, say, doubleword aligned and it will really be + singleword aligned. + + I'm not sure you can solve this without knowing the types of all + the arguments. All in all, we never promised varargs would work + reliably. */ + + + +#define QUICKTHREADS_VADJ(sp) (((char *)sp) - QUICKTHREADS_VSTKBASE) + +/* Always allocate at least enough space for 8 args; waste some space + at the base of the stack to ensure the startup routine doesn't read + off the end of the stack. */ + +#define QUICKTHREADS_VARGS_MD0(sp, vabytes) \ + ((qt_t *)(((char *)(sp)) - 8*4 - QUICKTHREADS_STKROUNDUP(vabytes))) + +extern void qt_vstart(void); +#define QUICKTHREADS_VARGS_MD1(sp) (QUICKTHREADS_SPUT (sp, QUICKTHREADS_1, qt_vstart)) + + + struct qt_t * +qt_vargs (struct qt_t *qsp, int nbytes, void *vargs, + void *pt, qt_function_t *startup, + qt_function_t *vuserf, qt_function_t *cleanup) +{ + va_list ap; + int i; + int n; /* Number of words into original arg list. */ + qt_word_t *sp; + int *reg; /* Where to read passed-in-reg args. */ + int *stk; /* Where to read passed-on-stk args. */ + + ap = *(va_list *)vargs; + qsp = QUICKTHREADS_VARGS_MD0 (qsp, nbytes); + sp = (qt_word_t *)qsp; + + reg = (ap.__va_arg < 8) + ? &ap.__va_reg[ap.__va_arg] + : 0; + stk = &ap.__va_stk[8]; + n = ap.__va_arg; + for (i=0; i<nbytes/sizeof(qt_word_t) && n<8; ++i,++n) { + sp[i] = *reg++; + } + for (; i<nbytes/sizeof(qt_word_t); ++i) { + sp[i] = *stk++; + } + +#ifdef QUICKTHREADS_NDEF + for (i=0; i<nbytes/sizeof(qt_word_t); ++i) { + sp[i] = (n < 8) + ? *reg++ + : *stk++; + ++n; + } +#endif + + QUICKTHREADS_VARGS_MD1 (QUICKTHREADS_VADJ(sp)); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VARGT_INDEX, pt); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VSTARTUP_INDEX, startup); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VUSERF_INDEX, vuserf); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VCLEANUP_INDEX, cleanup); + return ((qt_t *)QUICKTHREADS_VADJ(sp)); +} diff --git a/ext/systemc/src/sysc/qt/md/m88k.h b/ext/systemc/src/sysc/qt/md/m88k.h new file mode 100644 index 000000000..f9cab5327 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/m88k.h @@ -0,0 +1,159 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#ifndef QUICKTHREADS_M88K_H +#define QUICKTHREADS_M88K_H + +typedef unsigned long qt_word_t; + +#define QUICKTHREADS_GROW_DOWN + +/* Stack layout on the mips: + + Callee-save registers are: $16-$23, $30; $f20-$f30. + Also save $31, return pc. + + Non-varargs: + + +--- + | r30 (fp) on startup === 0 + | r25 + | r24 + | r23 + | r22 + | r21 + | r20 + | r19 + | r18 + | r17 on startup === `only' + | r16 on startup === `userf' + | r15 on startup === `pt' + | r14 on startup === `pu' + | r1 on startup === `qt_start' + | 0 + | 0 + +--- + | 0 + | ... (8 regs worth === 32 bytes of homing area) + | 0 <--- sp + +--- + + Conventions for varargs: + + | : + | arg8 + +--- + | r30 (fp) arg7 + | r25 arg6 + | r24 arg5 + | r23 arg4 + | r22 arg3 + | r21 arg2 + | r20 arg1 + | r19 arg0 + | r18 + | r17 on startup === `startup' + | r16 on startup === `vuserf' + | r15 on startup === `pt' + | r14 on startup === `cleanup' + | r1 on startup === `qt_vstart' + | 0 + | 0 + +--- + | 0 + | ... (8 regs worth === 32 bytes of homing area) + | 0 <--- sp + +--- + + */ + + +/* Stack must be doubleword aligned. */ +#define QUICKTHREADS_STKALIGN (16) /* Doubleword aligned. */ + +/* How much space is allocated to hold all the crud for + initialization: saved registers plus padding to keep the stack + aligned plus 8 words of padding to use as a `homing area' (for + r2-r9) when calling helper functions on the stack of the (not yet + started) thread. The varargs save area is small because it gets + overlapped with the top of the parameter list. In case the + parameter list is less than 8 args, QUICKTHREADS_ARGS_MD0 adds some dead + space at the top of the stack. */ + +#define QUICKTHREADS_STKBASE (16*4 + 8*4) +#define QUICKTHREADS_VSTKBASE (8*4 + 8*4) + + +/* Index of various registers. */ +#define QUICKTHREADS_1 (8+2) +#define QUICKTHREADS_14 (8+3) +#define QUICKTHREADS_15 (8+4) +#define QUICKTHREADS_16 (8+5) +#define QUICKTHREADS_17 (8+6) +#define QUICKTHREADS_30 (8+15) + + +/* When a never-before-run thread is restored, the return pc points + to a fragment of code that starts the thread running. For + non-vargs functions, it sets up arguments and calls the client's + `only' function. For varargs functions, the startup code calls the + startup, user, and cleanup functions. + + For non-varargs functions, we set the frame pointer to 0 to + null-terminate the call chain. + + For varargs functions, the frame pointer register is used to hold + one of the arguments, so that all arguments can be laid out in + memory by the conventional `qt_vargs' varargs initialization + routine. + + The varargs startup routine always reads 8 words of arguments from + the stack. If there are less than 8 words of arguments, then the + arg list could call off the top of the stack. To prevent fall-off, + always allocate 8 words. */ + +extern void qt_start(void); +#define QUICKTHREADS_ARGS_MD(sp) \ + (QUICKTHREADS_SPUT (sp, QUICKTHREADS_1, qt_start), \ + QUICKTHREADS_SPUT (sp, QUICKTHREADS_30, 0)) + + +/* The m88k uses a struct for `va_list', so pass a pointer to the + struct. */ + +typedef void (qt_function_t)(void); + +struct qt_t; +extern struct qt_t *qt_vargs (struct qt_t *sp, int nbytes, + void *vargs, void *pt, + qt_function_t *startup, + qt_function_t *vuserf, + qt_function_t *cleanup); + +#define QUICKTHREADS_VARGS(sp, nbytes, vargs, pt, startup, vuserf, cleanup) \ + (qt_vargs (sp, nbytes, &(vargs), pt, (qt_function_t *)startup, \ + (qt_function_t *)vuserf, (qt_function_t *)cleanup)) + + +/* The *index* (positive offset) of where to put each value. */ +#define QUICKTHREADS_ONLY_INDEX (QUICKTHREADS_17) +#define QUICKTHREADS_USER_INDEX (QUICKTHREADS_16) +#define QUICKTHREADS_ARGT_INDEX (QUICKTHREADS_15) +#define QUICKTHREADS_ARGU_INDEX (QUICKTHREADS_14) + +#define QUICKTHREADS_VCLEANUP_INDEX (QUICKTHREADS_14) +#define QUICKTHREADS_VUSERF_INDEX (QUICKTHREADS_16) +#define QUICKTHREADS_VSTARTUP_INDEX (QUICKTHREADS_17) +#define QUICKTHREADS_VARGT_INDEX (QUICKTHREADS_15) + +#endif /* ndef QUICKTHREADS_M88K_H */ diff --git a/ext/systemc/src/sysc/qt/md/m88k.s b/ext/systemc/src/sysc/qt/md/m88k.s new file mode 100644 index 000000000..42467e8d5 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/m88k.s @@ -0,0 +1,132 @@ +/* m88k.s -- assembly support. */ + +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +/* Callee-save r14..r25, r31(sp), r30(fp). r1 === return pc. + * Argument registers r2..r9, return value r2..r3. + * + * On startup, restore regs so retpc === call to a function to start. + * + * We're going to call a function (r2) from within the context switch + * routine. Call it on the new thread's stack on behalf of the old + * thread. + */ + + .globl _qt_block + .globl _qt_blocki + .globl _qt_abort + .globl _qt_start + .globl _qt_vstart + + /* + ** r2: ptr to function to call once curr is suspended + ** and control is on r5's stack. + ** r3: 1'th arg to *r2. + ** r4: 2'th arg to *r2. + ** r5: sp of thread to suspend. + ** + ** The helper routine returns a value that is passed on as the + ** return value from the blocking routine. Since we don't + ** touch r2 between the helper's return and the end of + ** function, we get this behavior for free. + ** + ** Same entry for integer-only and floating-point, since there + ** are no separate integer and floating-point registers. + ** + ** Each procedure call sets aside a ``home region'' of 8 regs + ** for r2-r9 for varargs. For context switches we don't use + ** the ``home region'' for varargs so use it to save regs. + ** Allocate 64 bytes of save space -- use 32 bytes of register + ** save area passed in to us plus 32 bytes we allcated, use + ** the other 32 bytes for save area for a save area to call + ** the helper function. + */ +_qt_block: +_qt_blocki: + sub r31, r31,64 /* Allocate reg save space. */ + st r1, r31,8+32 /* Save callee-save registers. */ + st r14, r31,12+32 + st.d r15, r31,16+32 + st.d r17, r31,24+32 + st.d r19, r31,32+32 + st.d r21, r31,40+32 + st.d r23, r31,48+32 + st r25, r31,56+32 + st r30, r31,60+32 + +_qt_abort: + addu r14, r31,0 /* Remember old sp. */ + addu r31, r5,0 /* Set new sp. */ + jsr.n r2 /* Call helper. */ + addu r2, r14,0 /* Pass old sp as an arg0 to helper. */ + + ld r1, r31,8+32 /* Restore callee-save registers. */ + ld r14, r31,12+32 + ld.d r15, r31,16+32 + ld.d r17, r31,24+32 + ld.d r19, r31,32+32 + ld.d r21, r31,40+32 + ld.d r23, r31,48+32 + ld r25, r31,56+32 + ld r30, r31,60+32 + + jmp.n r1 /* Return to new thread's caller. */ + addu r31, r31,64 /* Free register save space. */ + + + /* + ** Non-varargs thread startup. + ** See `m88k.h' for register use conventions. + */ +_qt_start: + addu r2, r14,0 /* Set user arg `pu'. */ + addu r3, r15,0 /* ... user function pt. */ + jsr.n r17 /* Call `only'. */ + addu r4, r16,0 /* ... user function userf. */ + + bsr _qt_error /* `only' erroniously returned. */ + + + /* + ** Varargs thread startup. + ** See `m88k.h' for register use conventions. + ** + ** Call the `startup' function with just argument `pt'. + ** Then call `vuserf' with 8 register args plus any + ** stack args. + ** Then call `cleanup' with `pt' and the return value + ** from `vuserf'. + */ +_qt_vstart: + addu r18, r30,0 /* Remember arg7 to `vuserf'. */ + addu r30, r0,0 /* Null-terminate call chain. */ + + jsr.n r17 /* Call `startup'. */ + addu r2, r15,0 /* `pt' is arg0 to `startup'. */ + + addu r2, r19,0 /* Set arg0. */ + addu r3, r20,0 /* Set arg1. */ + addu r4, r21,0 /* Set arg2. */ + addu r5, r22,0 /* Set arg3. */ + addu r6, r23,0 /* Set arg4. */ + addu r7, r24,0 /* Set arg5. */ + addu r8, r25,0 /* Set arg6. */ + jsr.n r16 /* Call `vuserf'. */ + addu r9, r18,0 /* Set arg7. */ + + addu r3, r2,0 /* Ret. value is arg1 to `cleanup'. */ + jsr.n r14 /* Call `cleanup'. */ + addu r2, r15,0 /* `pt' is arg0 to `cleanup'. */ + + bsr _qt_error /* `cleanup' erroniously returned. */ diff --git a/ext/systemc/src/sysc/qt/md/m88k_b.s b/ext/systemc/src/sysc/qt/md/m88k_b.s new file mode 100644 index 000000000..1926e6ae8 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/m88k_b.s @@ -0,0 +1,117 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + .text + .globl _b_call_reg + .globl _b_call_imm + .globl _b_add + .globl _b_load + +_b_null: + jmp r1 + +_b_call_reg: + subu r31, r31,8 /* Alloc ret pc save space. */ + st r1, r31,32 /* Save ret pc. */ + or.u r3, r0,hi16(_b_null) /* Put call addr in a reg. */ + or r3, r3,lo16(_b_null) + jsr r3 +L0: + jsr r3 + jsr r3 + jsr r3 + jsr.n r3 + subu r2, r2,5 /* Decrement #of iter to go. */ + bcnd.n gt0,r2,L0 + jsr r3 + + ld r1, r31,32 + jmp r1 + + +_b_call_imm: + subu r31, r31,8 /* Alloc ret pc save space. */ + st r1, r31,32 /* Save ret pc. */ + bsr _b_null +L1: + bsr _b_null + bsr _b_null + bsr _b_null + bsr.n _b_null + subu r2, r2,5 /* Decrement #of iter to go. */ + bcnd.n gt0,r2,L1 + bsr _b_null + + ld r1, r31,32 + jmp r1 + +_b_add: + add r0, r3,r4 +L2: + add r3, r4,r5 + add r4, r5,r6 + add r5, r6,r7 + add r8, r9,r0 + add r0, r3,r4 + add r3, r4,r5 + add r4, r5,r6 + add r5, r6,r7 + add r8, r9,r0 + + add r0, r3,r4 + add r3, r4,r5 + add r4, r5,r6 + add r5, r6,r7 + add r8, r9,r0 + add r0, r3,r4 + add r3, r4,r5 + add r4, r5,r6 + add r5, r6,r7 + add r8, r9,r0 + + subu r2, r2,20 /* Decrement #of iter to go. */ + bcnd.n gt0,r2,L2 + add r0, r3,r4 + + jmp r1 + + +_b_load: + ld r0, r31,0 +L3: + ld r3, r31,4 + ld r4, r31,8 + ld r5, r31,12 + ld r6, r31,16 + ld r0, r31,0 + ld r3, r31,4 + ld r4, r31,8 + ld r5, r31,12 + ld r6, r31,16 + + ld r0, r31,0 + ld r3, r31,4 + ld r4, r31,8 + ld r5, r31,12 + ld r6, r31,16 + ld r0, r31,0 + ld r3, r31,4 + ld r4, r31,8 + ld r5, r31,12 + ld r6, r31,16 + + subu r2, r2,20 /* Decrement #of iter to go. */ + bcnd.n gt0,r2,L3 + ld r0, r31,0 + + jmp r1 diff --git a/ext/systemc/src/sysc/qt/md/mips-irix5.s b/ext/systemc/src/sysc/qt/md/mips-irix5.s new file mode 100644 index 000000000..234a953ed --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/mips-irix5.s @@ -0,0 +1,182 @@ +/* mips.s -- assembly support. */ + +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +/* Callee-save $16-$23, $30-$31. + * + * $25 is used as a procedure value pointer, used to discover constants + * in a callee. Thus, each caller here sets $25 before the call. + * + * On startup, restore regs so retpc === call to a function to start. + * We're going to call a function ($4) from within this routine. + * We're passing 3 args, therefore need to allocate 12 extra bytes on + * the stack for a save area. The start routine needs a like 16-byte + * save area. Must be doubleword aligned (_mips r3000 risc + * architecture_, gerry kane, pg d-23). + */ + +/* + * Modified by Assar Westerlund <assar@sics.se> to support Irix 5.x + * calling conventions for dynamically-linked code. + */ + + /* Make this position-independent code. */ + .option pic2 + + .globl qt_block + .globl qt_blocki + .globl qt_abort + .globl qt_start + .globl qt_vstart + + /* + ** $4: ptr to function to call once curr is suspended + ** and control is on $7's stack. + ** $5: 1'th arg to $4. + ** $6: 2'th arg to $4 + ** $7: sp of thread to suspend. + ** + ** Totally gross hack: The MIPS calling convention reserves + ** 4 words on the stack for a0..a3. This routine "ought" to + ** allocate space for callee-save registers plus 4 words for + ** the helper function, but instead we use the 4 words + ** provided by the function that called us (we don't need to + ** save our argument registers). So what *appears* to be + ** allocating only 40 bytes is actually allocating 56, by + ** using the caller's 16 bytes. + ** + ** The helper routine returns a value that is passed on as the + ** return value from the blocking routine. Since we don't + ** touch $2 between the helper's return and the end of + ** function, we get this behavior for free. + */ +qt_blocki: + sub $sp,$sp,40 /* Allocate reg save space. */ + sw $16, 0+16($sp) + sw $17, 4+16($sp) + sw $18, 8+16($sp) + sw $19,12+16($sp) + sw $20,16+16($sp) + sw $21,20+16($sp) + sw $22,24+16($sp) + sw $23,28+16($sp) + sw $30,32+16($sp) + sw $31,36+16($sp) + add $2, $sp,$0 /* $2 <= old sp to pass to func@$4. */ +qt_abort: + add $sp, $7,$0 /* $sp <= new sp. */ + .set noreorder + add $25, $4,$0 /* Set helper function procedure value. */ + jal $31,$25 /* Call helper func@$4 . */ + add $4, $2,$0 /* $a0 <= pass old sp as a parameter. */ + .set reorder + lw $31,36+16($sp) /* Restore callee-save regs... */ + lw $30,32+16($sp) + lw $23,28+16($sp) + lw $22,24+16($sp) + lw $21,20+16($sp) + lw $20,16+16($sp) + lw $19,12+16($sp) + lw $18, 8+16($sp) + lw $17, 4+16($sp) + lw $16, 0+16($sp) /* Restore callee-save */ + + add $sp,$sp,40 /* Deallocate reg save space. */ + j $31 /* Return to caller. */ + + /* + ** Non-varargs thread startup. + ** Note: originally, 56 bytes were allocated on the stack. + ** The thread restore routine (_blocki/_abort) removed 40 + ** of them, which means there is still 16 bytes for the + ** argument area required by the MIPS calling convention. + */ +qt_start: + add $4, $16,$0 /* Load up user function pu. */ + add $5, $17,$0 /* ... user function pt. */ + add $6, $18,$0 /* ... user function userf. */ + add $25, $19,$0 /* Set `only' procedure value. */ + jal $31,$25 /* Call `only'. */ + la $25,qt_error /* Set `qt_error' procedure value. */ + j $25 + + + /* + ** Save calle-save floating-point regs $f20-$f30 + ** See comment in `qt_block' about calling conventinos and + ** reserved space. Use the same trick here, but here we + ** actually have to allocate all the bytes since we have to + ** leave 4 words leftover for `qt_blocki'. + ** + ** Return value from `qt_block' is the same as the return from + ** `qt_blocki'. We get that for free since we don't touch $2 + ** between the return from `qt_blocki' and the return from + ** `qt_block'. + */ +qt_block: + sub $sp, $sp,56 /* 6 8-byte regs, saved ret pc, aligned. */ + swc1 $f20, 0+16($sp) + swc1 $f22, 8+16($sp) + swc1 $f24, 16+16($sp) + swc1 $f26, 24+16($sp) + swc1 $f28, 32+16($sp) + swc1 $f30, 40+16($sp) + sw $31, 48+16($sp) + jal qt_blocki + lwc1 $f20, 0+16($sp) + lwc1 $f22, 8+16($sp) + lwc1 $f24, 16+16($sp) + lwc1 $f26, 24+16($sp) + lwc1 $f28, 32+16($sp) + lwc1 $f30, 40+16($sp) + lw $31, 48+16($sp) + add $sp, $sp,56 + j $31 + + + /* + ** First, call `startup' with the `pt' argument. + ** + ** Next, call the user's function with all arguments. + ** Note that we don't know whether args were passed in + ** integer regs, fp regs, or on the stack (See Gerry Kane + ** "MIPS R2000 RISC Architecture" pg D-22), so we reload + ** all the registers, possibly with garbage arguments. + ** + ** Finally, call `cleanup' with the `pt' argument and with + ** the return value from the user's function. It is an error + ** for `cleanup' to return. + */ +qt_vstart: + add $4, $17,$0 /* `pt' is arg0 to `startup'. */ + add $25, $18,$0 /* Set `startup' procedure value. */ + jal $31, $25 /* Call `startup'. */ + + add $sp, $sp,16 /* Free extra save space. */ + lw $4, 0($sp) /* Load up args. */ + lw $5, 4($sp) + lw $6, 8($sp) + lw $7, 12($sp) + lwc1 $f12, 0($sp) /* Load up fp args. */ + lwc1 $f14, 8($sp) + add $25, $19,$0 /* Set `userf' procedure value. */ + jal $31,$25 /* Call `userf'. */ + + add $4, $17,$0 /* `pt' is arg0 to `cleanup'. */ + add $5, $2,$0 /* Ret. val is arg1 to `cleanup'. */ + add $25, $16,$0 /* Set `cleanup' procedure value. */ + jal $31, $25 /* Call `cleanup'. */ + + la $25,qt_error /* Set `qt_error' procedure value. */ + j $25 diff --git a/ext/systemc/src/sysc/qt/md/mips.h b/ext/systemc/src/sysc/qt/md/mips.h new file mode 100644 index 000000000..14d109461 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/mips.h @@ -0,0 +1,134 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#ifndef QUICKTHREADS_MIPS_H +#define QUICKTHREADS_MIPS_H + +typedef unsigned long qt_word_t; + +#define QUICKTHREADS_GROW_DOWN + +/* Stack layout on the mips: + + Callee-save registers are: $16-$23, $30; $f20-$f30. + Also save $31, return pc. + + Non-varargs: + + +--- + | $f30 The first clump is only saved if `qt_block' + | $f28 is called, in which case it saves the fp regs + | $f26 then calls `qt_blocki' to save the int regs. + | $f24 + | $f22 + | $f20 + | $31 === return pc in `qt_block' + +--- + | $31 === return pc; on startup == qt_start + | $30 + | $23 + | $22 + | $21 + | $20 + | $19 on startup === only + | $18 on startup === $a2 === userf + | $17 on startup === $a1 === pt + | $16 on startup === $a0 === pu + | <a3> save area req'd by MIPS calling convention + | <a2> save area req'd by MIPS calling convention + | <a1> save area req'd by MIPS calling convention + | <a0> save area req'd by MIPS calling convention <--- sp + +--- + + Conventions for varargs: + + | args ... + +--- + | : + | : + | $21 + | $20 + | $19 on startup === `userf' + | $18 on startup === `startup' + | $17 on startup === `pt' + | $16 on startup === `cleanup' + | <a3> + | <a2> + | <a1> + | <a0> <--- sp + +--- + + Note: if we wanted to, we could muck about and try to get the 4 + argument registers loaded in to, e.g., $22, $23, $30, and $31, + and the return pc in, say, $20. Then, the first 4 args would + not need to be loaded from memory, they could just use + register-to-register copies. */ + + +/* Stack must be doubleword aligned. */ +#define QUICKTHREADS_STKALIGN (8) /* Doubleword aligned. */ + +/* How much space is allocated to hold all the crud for + initialization: $16-$23, $30, $31. Just do an integer restore, + no need to restore floating-point. Four words are needed for the + argument save area for the helper function that will be called for + the old thread, just before the new thread starts to run. */ + +#define QUICKTHREADS_STKBASE (14 * 4) +#define QUICKTHREADS_VSTKBASE QUICKTHREADS_STKBASE + + +/* Offsets of various registers. */ +#define QUICKTHREADS_31 (9+4) +#define QUICKTHREADS_19 (3+4) +#define QUICKTHREADS_18 (2+4) +#define QUICKTHREADS_17 (1+4) +#define QUICKTHREADS_16 (0+4) + + +/* When a never-before-run thread is restored, the return pc points + to a fragment of code that starts the thread running. For + non-vargs functions, it just calls the client's `only' function. + For varargs functions, it calls the startup, user, and cleanup + functions. + + The varargs startup routine always reads 4 words of arguments from + the stack. If there are less than 4 words of arguments, then the + startup routine can read off the top of the stack. To prevent + errors we always allocate 4 words. If there are more than 3 words + of arguments, the 4 preallocated words are simply wasted. */ + +extern void qt_start(void); +#define QUICKTHREADS_ARGS_MD(sp) (QUICKTHREADS_SPUT (sp, QUICKTHREADS_31, qt_start)) + +#define QUICKTHREADS_VARGS_MD0(sp, vabytes) \ + ((qt_t *)(((char *)(sp)) - 4*4 - QUICKTHREADS_STKROUNDUP(vabytes))) + +extern void qt_vstart(void); +#define QUICKTHREADS_VARGS_MD1(sp) (QUICKTHREADS_SPUT (sp, QUICKTHREADS_31, qt_vstart)) + +#define QUICKTHREADS_VARGS_DEFAULT + + +/* The *index* (positive offset) of where to put each value. */ +#define QUICKTHREADS_ONLY_INDEX (QUICKTHREADS_19) +#define QUICKTHREADS_USER_INDEX (QUICKTHREADS_18) +#define QUICKTHREADS_ARGT_INDEX (QUICKTHREADS_17) +#define QUICKTHREADS_ARGU_INDEX (QUICKTHREADS_16) + +#define QUICKTHREADS_VCLEANUP_INDEX (QUICKTHREADS_16) +#define QUICKTHREADS_VUSERF_INDEX (QUICKTHREADS_19) +#define QUICKTHREADS_VSTARTUP_INDEX (QUICKTHREADS_18) +#define QUICKTHREADS_VARGT_INDEX (QUICKTHREADS_17) + +#endif /* ndef QUICKTHREADS_MIPS_H */ diff --git a/ext/systemc/src/sysc/qt/md/mips.s b/ext/systemc/src/sysc/qt/md/mips.s new file mode 100644 index 000000000..b074b98dc --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/mips.s @@ -0,0 +1,164 @@ +/* mips.s -- assembly support. */ + +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +/* Callee-save $16-$23, $30-$31. + * + * On startup, restore regs so retpc === call to a function to start. + * We're going to call a function ($4) from within this routine. + * We're passing 3 args, therefore need to allocate 12 extra bytes on + * the stack for a save area. The start routine needs a like 16-byte + * save area. Must be doubleword aligned (_mips r3000 risc + * architecture_, gerry kane, pg d-23). + */ + + .globl qt_block + .globl qt_blocki + .globl qt_abort + .globl qt_start + .globl qt_vstart + + /* + ** $4: ptr to function to call once curr is suspended + ** and control is on $7's stack. + ** $5: 1'th arg to $4. + ** $6: 2'th arg to $4 + ** $7: sp of thread to suspend. + ** + ** Totally gross hack: The MIPS calling convention reserves + ** 4 words on the stack for a0..a3. This routine "ought" to + ** allocate space for callee-save registers plus 4 words for + ** the helper function, but instead we use the 4 words + ** provided by the function that called us (we don't need to + ** save our argument registers). So what *appears* to be + ** allocating only 40 bytes is actually allocating 56, by + ** using the caller's 16 bytes. + ** + ** The helper routine returns a value that is passed on as the + ** return value from the blocking routine. Since we don't + ** touch $2 between the helper's return and the end of + ** function, we get this behavior for free. + */ +qt_blocki: + sub $sp,$sp,40 /* Allocate reg save space. */ + sw $16, 0+16($sp) + sw $17, 4+16($sp) + sw $18, 8+16($sp) + sw $19,12+16($sp) + sw $20,16+16($sp) + sw $21,20+16($sp) + sw $22,24+16($sp) + sw $23,28+16($sp) + sw $30,32+16($sp) + sw $31,36+16($sp) + add $2, $sp,$0 /* $2 <= old sp to pass to func@$4. */ +qt_abort: + add $sp, $7,$0 /* $sp <= new sp. */ + .set noreorder + jal $31,$4 /* Call helper func@$4 . */ + add $4, $2,$0 /* $a0 <= pass old sp as a parameter. */ + .set reorder + lw $31,36+16($sp) /* Restore callee-save regs... */ + lw $30,32+16($sp) + lw $23,28+16($sp) + lw $22,24+16($sp) + lw $21,20+16($sp) + lw $20,16+16($sp) + lw $19,12+16($sp) + lw $18, 8+16($sp) + lw $17, 4+16($sp) + lw $16, 0+16($sp) /* Restore callee-save */ + + add $sp,$sp,40 /* Deallocate reg save space. */ + j $31 /* Return to caller. */ + + /* + ** Non-varargs thread startup. + ** Note: originally, 56 bytes were allocated on the stack. + ** The thread restore routine (_blocki/_abort) removed 40 + ** of them, which means there is still 16 bytes for the + ** argument area required by the MIPS calling convention. + */ +qt_start: + add $4, $16,$0 /* Load up user function pu. */ + add $5, $17,$0 /* ... user function pt. */ + add $6, $18,$0 /* ... user function userf. */ + jal $31,$19 /* Call `only'. */ + j qt_error + + + /* + ** Save calle-save floating-point regs $f20-$f30 + ** See comment in `qt_block' about calling conventinos and + ** reserved space. Use the same trick here, but here we + ** actually have to allocate all the bytes since we have to + ** leave 4 words leftover for `qt_blocki'. + ** + ** Return value from `qt_block' is the same as the return from + ** `qt_blocki'. We get that for free since we don't touch $2 + ** between the return from `qt_blocki' and the return from + ** `qt_block'. + */ +qt_block: + sub $sp, $sp,56 /* 6 8-byte regs, saved ret pc, aligned. */ + swc1 $f20, 0+16($sp) + swc1 $f22, 8+16($sp) + swc1 $f24, 16+16($sp) + swc1 $f26, 24+16($sp) + swc1 $f28, 32+16($sp) + swc1 $f30, 40+16($sp) + sw $31, 48+16($sp) + jal qt_blocki + lwc1 $f20, 0+16($sp) + lwc1 $f22, 8+16($sp) + lwc1 $f24, 16+16($sp) + lwc1 $f26, 24+16($sp) + lwc1 $f28, 32+16($sp) + lwc1 $f30, 40+16($sp) + lw $31, 48+16($sp) + add $sp, $sp,56 + j $31 + + + /* + ** First, call `startup' with the `pt' argument. + ** + ** Next, call the user's function with all arguments. + ** Note that we don't know whether args were passed in + ** integer regs, fp regs, or on the stack (See Gerry Kane + ** "MIPS R2000 RISC Architecture" pg D-22), so we reload + ** all the registers, possibly with garbage arguments. + ** + ** Finally, call `cleanup' with the `pt' argument and with + ** the return value from the user's function. It is an error + ** for `cleanup' to return. + */ +qt_vstart: + add $4, $17,$0 /* `pt' is arg0 to `startup'. */ + jal $31, $18 /* Call `startup'. */ + + add $sp, $sp,16 /* Free extra save space. */ + lw $4, 0($sp) /* Load up args. */ + lw $5, 4($sp) + lw $6, 8($sp) + lw $7, 12($sp) + lwc1 $f12, 0($sp) /* Load up fp args. */ + lwc1 $f14, 8($sp) + jal $31,$19 /* Call `userf'. */ + + add $4, $17,$0 /* `pt' is arg0 to `cleanup'. */ + add $5, $2,$0 /* Ret. val is arg1 to `cleanup'. */ + jal $31, $16 /* Call `cleanup'. */ + + j qt_error diff --git a/ext/systemc/src/sysc/qt/md/mips_b.s b/ext/systemc/src/sysc/qt/md/mips_b.s new file mode 100644 index 000000000..5b3740843 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/mips_b.s @@ -0,0 +1,99 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + .globl b_call_reg + .globl b_call_imm + .globl b_add + .globl b_load + + .ent b_null +b_null: + j $31 + .end b_null + + .ent b_call_reg +b_call_reg: + la $5,b_null + add $6, $31,0 +$L0: + jal $5 + jal $5 + jal $5 + jal $5 + jal $5 + + sub $4, $4,5 + bgtz $4,$L0 + j $6 + .end + + + .ent b_call_imm +b_call_imm: + add $6, $31,0 +$L1: + jal b_null + jal b_null + jal b_null + jal b_null + jal b_null + + sub $4, $4,5 + bgtz $4,$L1 + j $6 + .end + + + .ent b_add +b_add: + add $5, $0,$4 + add $6, $0,$4 + add $7, $0,$4 + add $8, $0,$4 +$L2: + sub $4, $4,5 + sub $5, $5,5 + sub $6, $6,5 + sub $7, $7,5 + sub $8, $8,5 + + sub $4, $4,5 + sub $5, $5,5 + sub $6, $6,5 + sub $7, $7,5 + sub $8, $8,5 + + bgtz $4,$L2 + j $31 + .end + + + .ent b_load +b_load: +$L3: + ld $0, 0($sp) + ld $0, 4($sp) + ld $0, 8($sp) + ld $0, 12($sp) + ld $0, 16($sp) + + ld $0, 20($sp) + ld $0, 24($sp) + ld $0, 28($sp) + ld $0, 32($sp) + ld $0, 36($sp) + + sub $4, $4,10 + bgtz $4,$L3 + j $31 + .end diff --git a/ext/systemc/src/sysc/qt/md/null.README b/ext/systemc/src/sysc/qt/md/null.README new file mode 100644 index 000000000..e69de29bb --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/null.README diff --git a/ext/systemc/src/sysc/qt/md/null.c b/ext/systemc/src/sysc/qt/md/null.c new file mode 100644 index 000000000..db1a593ed --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/null.c @@ -0,0 +1,14 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +char const qtmd_rcsid[] = "$Header: /Users/acg/CVSROOT/systemc-2.3/src/sysc/qt/md/null.c,v 1.1.1.1 2006/12/15 20:20:06 acg Exp $"; diff --git a/ext/systemc/src/sysc/qt/md/null.s b/ext/systemc/src/sysc/qt/md/null.s new file mode 100644 index 000000000..8a2361f9e --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/null.s @@ -0,0 +1,12 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ diff --git a/ext/systemc/src/sysc/qt/md/powerpc.README b/ext/systemc/src/sysc/qt/md/powerpc.README new file mode 100644 index 000000000..b98da8b27 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/powerpc.README @@ -0,0 +1,27 @@ + +PowerPC assembly support + + +1) MacOS X, Darwin, MKLinux and other systems based on Mach kernel ABI: + + - Configuration command: ./config powerpc-darwin + + - See documentation inside powerpc_mach.h, powerpc_mach.s, powerpc.c. + + +2) LinuxPPC, and other systems based on System V ABI: + + - Configuration command: ./config powerpc + + - See documentation inside powerpc_sys5.h, powerpc_sys5.s, powerpc.c. + + +Marco Bucci <marco.bucci@inwind.it> +December 2002 + + + * This software is largely based on the original PowerPC-Linux porting + * developed by Ken Aaker <kenaaker@silverbacksystems.com> + * + * Marco Bucci <marco.bucci@inwind.it> + * December 2002 diff --git a/ext/systemc/src/sysc/qt/md/powerpc.c b/ext/systemc/src/sysc/qt/md/powerpc.c new file mode 100644 index 000000000..fb374f3f2 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/powerpc.c @@ -0,0 +1,69 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + +#include <stdarg.h> +#include "qt.h" + +// This static is used to find the end of the stack for variable + +static void *qt_sp_bottom_save; + +/* We actually don't know how the compiler accomodates arguments in the + * va_list. In some implementation (e.g. Linux PPC) we cannot scan the + * list as an array. To avoid this problem, this version of "qt_varg", + * retrieves arguments by means of the standard "va_arg" macro defined + * in stdargs.h. + * + * Notice that we still suppose that the number of arguments is given + * by nbytes/sizeof(qt_word_t) and we load the stack of "qt_vstart" + * assuming that all parameters are alligned to the size of qt_word_t. + * + * Marco Bucci <marco.bucci@inwind.it> + * December 2002 + */ + +/* + +qt_t *qt_vargs (qt_t *sp, int nbytes, void *vargs, + void *pt, qt_startup_t *startup, + qt_vuserf_t *vuserf, qt_cleanup_t *cleanup) + +*/ + + qt_t * +qt_vargs_stdarg (qt_t *sp, int nbytes, va_list vargs, + void *pt, qt_startup_t *startup, + qt_vuserf_t *vuserf, qt_cleanup_t *cleanup) + + + +{ + int i; + qt_word_t arg; + + sp = QUICKTHREADS_VARGS_MD0 (sp, nbytes); + + for ( i=0;i<(int)(nbytes/sizeof(qt_word_t)); i++) + { + arg = va_arg(vargs, qt_word_t); + QUICKTHREADS_SPUT (QUICKTHREADS_VARGS_ADJUST(sp), i, arg); + } + + QUICKTHREADS_VARGS_MD1 (QUICKTHREADS_VADJ(sp)); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VARGT_INDEX, pt); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VSTARTUP_INDEX, startup); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VUSERF_INDEX, vuserf); + QUICKTHREADS_SPUT (QUICKTHREADS_VADJ(sp), QUICKTHREADS_VCLEANUP_INDEX, cleanup); + return ((qt_t *)QUICKTHREADS_VADJ(sp)); +} diff --git a/ext/systemc/src/sysc/qt/md/powerpc_mach.h b/ext/systemc/src/sysc/qt/md/powerpc_mach.h new file mode 100644 index 000000000..677808c5c --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/powerpc_mach.h @@ -0,0 +1,611 @@ +/* + + * QuickThreads -- Threads-building toolkit. + + * Copyright (c) 1993 by David Keppel + + * + + * Permission to use, copy, modify and distribute this software and + + * its documentation for any purpose and without fee is hereby + + * granted, provided that the above copyright notice and this notice + + * appear in all copies. This software is provided as a + + * proof-of-concept and for demonstration purposes; there is no + + * representation about the suitability of this software for any + + * purpose. + + * + + + * PowerPC-Mach thread switching module. + + * + + * This software is largely based on the original PowerPC-Linux porting + + * developed by Ken Aaker <kenaaker@silverbacksystems.com> + + * + + * Marco Bucci <marco.bucci@inwind.it> + + * December 2002 + + * + + */ + + +#ifndef QUICKTHREADS_POWERPC_H +#define QUICKTHREADS_POWERPC_H + + +/***************************************************************************** + * + * DESCRIPTION + * + * This is the QuickThreads switching module implementation for PowerPC + * running under Mach kernel. It was developed and tested under MacOS X, that + * is under Darwin (the UNIX-BSD fundation of MacOS X). + * + * Notice that the Mach PowerPC ABI (Application Binary Interface) [1] is + * not the same than System V ABI [2] used by most of the LINUX PowerPC + * implementations. + * + * IMPLEMENTATION NOTES + * + * 1) Porting on System V ABI + * Excluding the variant argument calling convention, Mach and System V ABI + * are enough similar and it could be possible to use some simple macro, to + * adapt the code for both the ABIs. Actually, the only relevant difference + * is in the linkage area structure and in the position where the Link and + * the Condition registers are saved. As to the calling conventions, there + * are differences with floating points argument passing and with variant + * argument lists. Notice that, on Mach, the caller's stack frame allocates + * space to hold all arguments ([1] p.51), while on System V, the caller's + * stack frame allocates space to hold just the arguments that don't fit into + * registers ([2] p.3.18). + * + * 2) Variant argument list implementation + * Variant argument calling on a RISC machine is not easy to implement since + * parameters are passed via registers instead of via stack. In a general + * variant argument implementation, the caller's stack must map the whole + * parameter list following the rules related to the use of the GPR and FPR + * parameter registers and the stack alignment ([1] p.54). + * This implementation is quite simple and not general. It works under the + * hypothesis that arguments are 4-bytes aligned integers. + * + * 3) This heather file organisation + * I preferred to not make confusion between macros that are needed (i.e. + * directly used) by QuickThreads and internal "implementation" macros. You + * will find QuickThreds macros in the end of this header. Sometime they just + * refer to an analogous "internal" macro. On the top, there are the macros + * that I used to make more clean (I hope) the implementation. I could include + * some system heather (as to stack layout definitions, prologs and epilogs, + * etc.), but I preferred to have a self-contained heather in order to make + * all more clear for mantaining and for possible porting on another ABI. + * + * + * REFERENCES + * + * [1] - Mach-O Runtime Architecture + * Runtime Concepts and Conventions for Mac OS X Programs + * Preliminary July 2002 + * + * [2] - SYSTEM V APPLICATION BINARY INTERFACE + * PowerPC Processor Supplement + * September 1995 + * + * On MacOS X, more documentation is available by installing the "Developer + * Tools". Useful macros and documentation can be found in the system headers + * files such as asm.h, asm_help.h etc. (see /usr/architecture/ppc/ or + * /System/Library/Frameworks/Kernel.framework/Headers/architecture/ppc/). + + *****************************************************************************/ + +/***************************************************************************** + * + * PowerPC Mach-O Stack frame (see [1]) + * + + ................ + + + + | | reserved + + CALLER'S LINKAGE AREA + + | | Caller's LR + + + + | | Caller's CR + + + + backchain -> | | Caller's backchain + +==========================+ + | | FPR31 + + FPR SAVE AREA + + .............. + + + + | | FPRn + +--------------------------+ + | | GPR31 + + GPR SAVE AREA + + .............. + + + + | | GPRn + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | + + LOCAL VARIABLES AREA + + .............. + + + + | | + +--------------------------+ + | | PAR(n) + + + + | | + + PARAMETER AREA + + .............. + + for FUTURE call + + | | PAR(1) + + + + SP + 24 -> | | PAR(0) + +--------------------------+ + SP + 20 -> | | Caller's TOC + + + + SP + 16 -> | | reserved + + + + SP + 12 -> | | reserved + + LINKAGE AREA + + SP + 8 -> | | LR callee-save for FUTURE call + + + + SP + 4 -> | | CR callee-save for FUTURE call + + + + SP -> | | backchain + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + * NOTE: + * + * 1) Parameter are allocated in the CALLER's parameter area. This area must + * be large enough to hold all parameters regardless if they are or not passed + * in registers. + * + * The caller parameter area is used: + * - by the caller, to store parameters to the callee that cannot fit in + * registers (no more parameter registers are available); + * - by the callee, to save parameter registers (for istance because they are + * needed for a further call). + * + * Obviously, the callee saves parameter registers, in the location in which + * they are mapped on the caller's stack frame. So, be aware that, if + * something else is stored in that location, it could be deleted after a call. + * + * 2) The callee saves LR and CR in the caller's linkage area. All other + * callee's state are saved in its own stack frame. + * + + *****************************************************************************/ + + +/***************************************************************************** + * + * Stack initialization for a single argument thread + * + + + top + QUICKTHREADS_STKBASE -> STACK BOTTOM (higher address) + +==========================+ + | | + + + + .............. + + + + | | + +--------------------------+ + top + QUICKTHREADS_ONLY_INDEX * 4 -> | only param | PAR(3) + + + + top + QUICKTHREADS_USER_INDEX * 4 -> | userf param | PAR(2) + + + + top + QUICKTHREADS_ARGT_INDEX * 4 -> | t param | PAR(1) + + + + top + QUICKTHREADS_ARGU_INDEX * 4 -> | u param | PAR(0) + +--------------------------+ + | | + + + + .............. + + + + top + QUICKTHREADS_RETURN_INDEX * 4 -> | qt_start | LR save + + + + .............. + + + + top + QUICKTHREADS_BLOCKI_FRAME_SIZE -> | top + QUICKTHREADS_STKBASE | backchain + +==========================+ + | | + + + + .............. + + + + | | + +--------------------------+ + | | + + + + .............. + + + + top -> |top + QUICKTHREADS_BLOCKI_FRAME_SIZE| backchain + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + + ***************************************************************************** + * + * Stack initialization for a variant argument thread + * + + bottom -> STACK BOTTOM (higher address) + +==========================+ + | | + + + + .............. + + + + top + QUICKTHREADS_VSTKBASE -> | arg(0) | PAR(4) + +--------------------------+ + top + QUICKTHREADS_CLEANUP_INDEX * 4 -> | cleanup param | PAR(3) + + + + top + QUICKTHREADS_USER_INDEX * 4 -> | userf param | PAR(2) + + + + top + QUICKTHREADS_VSTARTUP_INDEX * 4 ->| startup param | PAR(1) + + + + top + QUICKTHREADS_ARGT_INDEX * 4 -> | t param | PAR(0) + +--------------------------+ + | | + + + + .............. + + + + top + QUICKTHREADS_RETURN_INDEX * 4 -> | qt_start | LR save + + + + .............. + top + QUICKTHREADS_BLOCKI_FRAME_SIZE -> | top + QUICKTHREADS_STKBASE | backchain + +==========================+ + | | + + + + .............. + + + + | | + +--------------------------+ + | | + + + + .............. + + + + top -> |top + QUICKTHREADS_BLOCKI_FRAME_SIZE| backchain + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + +* NOTE: +* +* Parameters are passed to "qt_start" or to "qt_vstart" putting them into +* the stack frames of "qt_start" or "qt_vstart" themselves. This not a +* conventional parameter passing because parameters should be put into the +* caller's stack, not into the callee's one. Actually we must consider +* that as a preload of the parameter area that "qt_start" or "qt_vstart" +* will use for their own calls. +* Be aware of the fact that, during a call, the caller's parameter area is, +* in a certain sense, volatile. In facts, the callee can save parameter +* registers on the caller's parameter area. +* + *****************************************************************************/ + + +/***************************************************************************** + + Define PowerPC Mach-O related macros + + *****************************************************************************/ + + + +typedef unsigned long PPC_W; + +/* Stack pointer must always be a multiple of 16 */ +#define PPC_STACK_INCR 16 +#define PPC_ROUND_STACK(length) \ + (((length)+PPC_STACK_INCR-1) & ~(PPC_STACK_INCR-1)) + + +#define PPC_LINKAGE_AREA 24 +#define PPC_CR_SAVE 4 +#define PPC_LR_SAVE 8 + +#define PPC_PARAM_AREA(n) (4*(n)) + +#define PPC_GPR_SAVE_AREA (4*19) /* GPR13-GPR31 must be saved */ +#define PPC_FPR_SAVE_AREA (8*18) /* FPR14-FPR31 must be saved */ + +/* Define parameter offset on the stack. + * NOTICE: Parameters are numbered 0, 1, ..., n. +*/ +#define PPC_PAR(i) (PPC_LINKAGE_AREA+(i)*4) + +/***************************************************************************** + + Define stack frames + + *****************************************************************************/ + + +/* Define the "qt_blocki" and "qt_abort" stack frame. We use the same stack + * frame for both. + * + + top + S -> + +==========================+ + top + S - 4 -> | | GPR31 + + GPR SAVE AREA + + .............. + + + + top + S - 19 * 4 -> | | GPR13 + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | + + + + | | + + PARAMETER AREA + + | | + + + + top + 24 -> | | + +--------------------------+ + | | + + LINKAGE AREA + + top -> | | + +==========================+ + */ + +#define QUICKTHREADS_BLOCKI_FRAME_SIZE \ + PPC_ROUND_STACK(PPC_LINKAGE_AREA+PPC_PARAM_AREA(4)+PPC_GPR_SAVE_AREA) + +/* Offset to the base of the GPR save area. Save from GPR13 to GPR31 + * increasing address. + */ +#define QUICKTHREADS_BLOCKI_GPR_SAVE(i) (QUICKTHREADS_BLOCKI_FRAME_SIZE-4+(i-31)*4) + + + +/* Define the "qt_block" stack frame. Notice that since "qt_black" calls + * "qt_blocki", GPR registers are saved into "qt_blocki" stack frame. + * + + top + S -> + +==========================+ + top + S - 8 -> | | FPR31 + + FPR SAVE AREA + + .............. + + + + top + S - 18 * 8 -> | | FPR14 + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | + + + + | | + + PARAMETER AREA + + | | + + + + top + 24 -> | | + +--------------------------+ + | | + + LINKAGE AREA + + top -> | | + +==========================+ + */ + +#define QUICKTHREADS_BLOCK_FRAME_SIZE \ + PPC_ROUND_STACK(PPC_LINKAGE_AREA+PPC_PARAM_AREA(4)+PPC_FPR_SAVE_AREA) + +/* Offset to the location where registers are saved. + */ +#define QUICKTHREADS_BLOCK_FPR_SAVE(i) (QUICKTHREADS_BLOCK_FRAME_SIZE-8+(i-31)*8) + + +/* Define the "qt_start" frame size. It consists just of the linkage area and + * the parameter area. + * + + +==========================+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | only par + + + + | | userf par + + PARAMETER AREA + + | | t par + + + + top + 24 -> | | u par + +--------------------------+ + | | + + LINKAGE AREA + + top -> | | + +==========================+ + + */ +#define QUICKTHREADS_START_FRAME_SIZE PPC_ROUND_STACK(PPC_LINKAGE_AREA+PPC_PARAM_AREA(4)) + + + +/* Define the "qt_vstart" frame. It consists of the linkage area, the fix parameter + * area, the variant argument list and a local variable area used in "qt_vstart" + * implementation. + * + + backchain -> + +==========================+ + backchain - 4 -> | | + + LOCAL VARIABLES AREA + + .............. + + + + | | + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | arg(n) + + + + | | + + VARIABLE ARGUMENT LIST + + .............. + + for userf call + + | | arg(1) + + + + top + 24 + 16 -> | | arg(0) + +--------------------------+ + | | cleanup par + + + + | | userf par + + PARAMETER AREA + + | | startup par + + + + top + 24 -> | | t par + +--------------------------+ + | | + + LINKAGE AREA + + top -> | | + +==========================+ + + */ +#define QUICKTHREADS_VARGS_LOCAL_AREA (4*4) /* local variable area */ + +/* The offset the stack will be moved back before to call "userf(...)". + * The linckage area must be moved to be adiacent to the part of the variant + * argument list that is in the stack. + */ +#define QUICKTHREADS_VARGS_BKOFF PPC_PARAM_AREA(4) + +#define QUICKTHREADS_VSTART_FRAME_SIZE(varbytes) \ + PPC_ROUND_STACK(PPC_LINKAGE_AREA+PPC_PARAM_AREA(4)+(varbytes)+ \ + QUICKTHREADS_VARGS_LOCAL_AREA) + +/* Offset to the base of the varian argument list */ +#define QUICKTHREADS_VSTART_LIST_BASE (PPC_LINKAGE_AREA+PPC_PARAM_AREA(4)) + + +/* Notice that qt_start and qt_vstart have no parameters, actually their + * parameters are written in their stack frame during thread initialization + */ +extern void qt_start(void); +extern void qt_vstart(void); + + + +/* Offset (in words) of the location where the block routine saves its return + * address (i.e. LR). SP points the top of the block routine stack and, + * following ppc calling conventions, the return address is saved in the + * previous (caller's) stack frame. + */ +#define QUICKTHREADS_RETURN_INDEX ((QUICKTHREADS_BLOCKI_FRAME_SIZE+PPC_LR_SAVE)/sizeof(PPC_W)) + +/* static variable used to get the stack bottom in "VARGS" initialization */ +/* static void *qt_sp_bottom_save; */ + +#define QUICKTHREADS_ARG_INDEX(i) ((QUICKTHREADS_BLOCKI_FRAME_SIZE+PPC_PAR(i))/sizeof(PPC_W)) + +/***************************************************************************** + + QuickThreads needed definitions + + *****************************************************************************/ + + +#define QUICKTHREADS_GROW_DOWN +#define QUICKTHREADS_STKALIGN PPC_STACK_INCR +typedef PPC_W qt_word_t; + + +/* This macro is used by "QUICKTHREADS_ARGS" to initialize a single argument thread. + * - set "qt_start" as the "qt_block" or "qt_blocki" return address; + * - set the top of the stack backchain; + * - set the next backchain (not needed, but just to be "clean"). + */ +#define QUICKTHREADS_ARGS_MD(sp) \ + (QUICKTHREADS_SPUT (sp, QUICKTHREADS_RETURN_INDEX, qt_start), \ + QUICKTHREADS_SPUT (sp, 0, sp+QUICKTHREADS_BLOCKI_FRAME_SIZE), \ + QUICKTHREADS_SPUT (sp, QUICKTHREADS_BLOCKI_FRAME_SIZE/sizeof(PPC_W), \ + sp+QUICKTHREADS_BLOCKI_FRAME_SIZE+QUICKTHREADS_START_FRAME_SIZE)) + + +/* This macro is used by "QUICKTHREADS_VARGS" to initialize a variant argument thread. + * It returns the pointer to the top of the argument list. + * We also use it to get the stack bottom via a static variable. This is a bit + * "dirty", it could be better to do it in "qt_vargs", but we don't want change + * anything out of this file. + * We need the stack bottom to allocate a local variable area used by + * "qt_vstart". + */ +#define QUICKTHREADS_VARGS_MD0(sp, varbytes) \ + ((qt_sp_bottom_save = sp), \ + ((qt_t *)(((char *)(sp)) - \ + (QUICKTHREADS_VSTART_FRAME_SIZE(varbytes)-QUICKTHREADS_VSTART_LIST_BASE)))) + + +/* This macro is used by "QUICKTHREADS_VARGS" to initialize a variant argument thread. + * - set "qt_start" as the "qt_block" or "qt_blocki" return address; + * - set the top of the stackback chain; + * - set the next backchain (it points the stack botton). + */ +#define QUICKTHREADS_VARGS_MD1(sp) \ + (QUICKTHREADS_SPUT (sp, QUICKTHREADS_RETURN_INDEX, qt_vstart), \ + QUICKTHREADS_SPUT (sp, 0, sp+QUICKTHREADS_BLOCKI_FRAME_SIZE), \ + QUICKTHREADS_SPUT (sp, (QUICKTHREADS_BLOCKI_FRAME_SIZE)/sizeof(PPC_W), \ + qt_sp_bottom_save)) + + +/* Activate "qt_vargs" as the initialization routine for the variant + * argument threads + */ +#define QUICKTHREADS_VARGS_DEFAULT + +/* Override "qt_vargs" with "qt_vargs_stdarg". + * On LinuxPPC "qt_vargs" doesn't work, "qt_vargs_stdarg" uses a more + * standard way to retrieve arguments from the variant list. + */ +#define QUICKTHREADS_VARGS(sp, nbytes, vargs, pt, startup, vuserf, cleanup) \ + ((qt_t *)qt_vargs_stdarg (sp, nbytes, vargs, pt, startup, vuserf, cleanup)) + + +/* This macro is used by "QUICKTHREADS_ADJ(sp)" to get the stack top form the stack + * bottom during a single argument thread initialization. + * It is the space we need to allocate for a single argument thread: the stack + * frame for the block routine ("qt_block" or "qt_blocki") and for "qt_start". + */ +#define QUICKTHREADS_STKBASE \ + (QUICKTHREADS_BLOCKI_FRAME_SIZE+QUICKTHREADS_START_FRAME_SIZE) + +/* This macro is used by "QUICKTHREADS_VADJ(sp)" to get the stack top from the base + * of the variant argument list during a variant argument thread initialization. + */ +#define QUICKTHREADS_VSTKBASE (QUICKTHREADS_BLOCKI_FRAME_SIZE+QUICKTHREADS_VSTART_LIST_BASE) + +/* The *index* (positive offset) of where to put each value. */ + +#define QUICKTHREADS_ARGU_INDEX QUICKTHREADS_ARG_INDEX(0) +#define QUICKTHREADS_ARGT_INDEX QUICKTHREADS_ARG_INDEX(1) +#define QUICKTHREADS_USER_INDEX QUICKTHREADS_ARG_INDEX(2) +#define QUICKTHREADS_ONLY_INDEX QUICKTHREADS_ARG_INDEX(3) + + +#define QUICKTHREADS_VARGT_INDEX QUICKTHREADS_ARG_INDEX(0) +#define QUICKTHREADS_VSTARTUP_INDEX QUICKTHREADS_ARG_INDEX(1) +#define QUICKTHREADS_VUSERF_INDEX QUICKTHREADS_ARG_INDEX(2) +#define QUICKTHREADS_VCLEANUP_INDEX QUICKTHREADS_ARG_INDEX(3) + +#endif /* ndef QUICKTHREADS_POWERPC_H */ + diff --git a/ext/systemc/src/sysc/qt/md/powerpc_mach.s b/ext/systemc/src/sysc/qt/md/powerpc_mach.s new file mode 100644 index 000000000..63414b05d --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/powerpc_mach.s @@ -0,0 +1,641 @@ +/* powerpc_mach.s -- assembly support. */ + +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + + + * PowerPC-Mach thread switching module. + * Darwin (MacOS X) assembly + * + * NOTICE: Syntax for register names is not the GNU one. Register are + * named "rx" and "fx", not "%rx" and "%fx" as usual for the GNU "as" tool. + * Darwin "as" tool is based on GNU "as" but follows the "official" PowerPC + * syntax. + * + * + * This software is largely based on the original PowerPC-Linux porting + * developed by Ken Aaker <kenaaker@silverbacksystems.com> + * + * Marco Bucci <marco.bucci@inwind.it> + * December 2002 + * + */ + + +/* + * + * PowerPC Register convections: + * + * r0 volatile + * r1 SP + * r2 system reserved + * r3-r4 volatile for parameter passing and function return + * r5-r10 volatile for parameter passing + * r11-r12 volatile + * r13-r14 non volatile registers + * f0 volatile + * f1 volatile for parameter passing and function return + * f2-f13 volatile for parameter passing + * f14-f31 non volatile + * + * cr2-cr4 non volatile + * + * + * See on the heather file for more documentation. + * + * + * + * IMPLEMENTATION NOTES + * + * + * 1) Condition register saving + * On most machines, the condition code register is caller-save. + * On the PPC, the condition code register is callee-save, so the + * thread context switch must preserve it. + * + * + * 2) Floating point registers saving + * On resuming a thread, floating point registers are or not restored just + * depending on which block routine suspended the thread (i.e. regardless + * whether "qt_block", "qt_blocki" or "qt_abort" is used to resume it). + * This behaviour is obtained by implementing "qt_block" by means af a nested + * call to "qt_blocki". As a result, the blocking of a thread always goes + * and returns through "qt_blocki and, if a thread was blocked by "qt_block", + * its execution resumes from the floating point restoring code on exit + * of "qt_block". + * + * Thanks to David Keppel that explained me this "simple" trick. + * + * + * 3) C languace code debugging + * This software was developed and debugged using the Metrowerks + * Code Warrior PPC integrated assembler. It can be still used with the + * Code Warrior compiler by means of the file "powerpc_mach_asm_debug.c" + * that include it. + * In order to avoid "copy and paste" bugs, and make easyer the maintaining, + * I made the minimal changes, so you can find some strange code as: + * + * #if 0 + * .if 0 + * C code here + * .endif + * #endif + * + * This is just to embed some C code that is needed by the Code Warrior + * integrated assembler. + * + * + * 4) Assembly constants generation + * Constants used in the assembly code are generated by running + * the C code in the sequel (commented). It uses the C macros declared in + * the C heather in order to guarantee that the C interface and the assebly + * code are "aligned". I avoided the use of an assebler preprocessor since + * they are not so standard and moreover using macro espressions makes the + * assembly debugging more difficult. + * + * + + +#include <iostream> +#include "powerpc_mach.h" + +int main() +{ + using namespace std; + + int i; + + cout << ".set LR_SAVE, " << PPC_LR_SAVE << endl; + cout << ".set CR_SAVE, " << PPC_CR_SAVE << endl; + cout << ".set BLOCKI_FSIZE, " << QUICKTHREADS_BLOCKI_FRAME_SIZE << endl; + cout << ".set BLOCK_FSIZE, " << QUICKTHREADS_BLOCK_FRAME_SIZE << endl; + + cout << endl; + for(i=0; i<12; i++) + cout << ".set PAR_" << i << ", " << PPC_PAR(i) << endl; + + cout << endl; + i = 13; + cout << ".set GPR_SAVE_" << i << ", " << QUICKTHREADS_BLOCKI_GPR_SAVE(i) << endl; + + cout << endl; + for(i=31; i>13; i--) + cout << ".set FPR_SAVE_" << i << ", " << QUICKTHREADS_BLOCK_FPR_SAVE(i) << endl; + + cout << endl; + cout << ".set VARGS_BKOFF, " << QUICKTHREADS_VARGS_BKOFF << endl; + + + cout << endl << endl << endl; + + for(i=31; i>13; i--) + cout << "\tstfd\tf" << i << ",FPR_SAVE_" << i << "(r1)" << endl; + + cout << endl; + for(i=31; i>13; i--) + cout << "\tlfd \tf" << i << ",FPR_SAVE_" << i << "(r1)" << endl; + + cout << endl << endl << endl; + + + return 0; +} + + + * + * + * + */ + + +#if 0 + + .text + .align 4 + + .globl qt_block + .globl _qt_block + .globl qt_blocki + .globl _qt_blocki + .globl qt_abort + .globl _qt_abort + .globl qt_start + .globl _qt_start + .globl qt_vstart + .globl _qt_vstart + + +.set LR_SAVE, 8 +.set CR_SAVE, 4 +.set BLOCKI_FSIZE, 128 +.set BLOCK_FSIZE, 192 + +.set PAR_0, 24 +.set PAR_1, 28 +.set PAR_2, 32 +.set PAR_3, 36 +.set PAR_4, 40 +.set PAR_5, 44 +.set PAR_6, 48 +.set PAR_7, 52 +.set PAR_8, 56 +.set PAR_9, 60 +.set PAR_10, 64 +.set PAR_11, 68 + +.set GPR_SAVE_13, 52 + +.set FPR_SAVE_31, 184 +.set FPR_SAVE_30, 176 +.set FPR_SAVE_29, 168 +.set FPR_SAVE_28, 160 +.set FPR_SAVE_27, 152 +.set FPR_SAVE_26, 144 +.set FPR_SAVE_25, 136 +.set FPR_SAVE_24, 128 +.set FPR_SAVE_23, 120 +.set FPR_SAVE_22, 112 +.set FPR_SAVE_21, 104 +.set FPR_SAVE_20, 96 +.set FPR_SAVE_19, 88 +.set FPR_SAVE_18, 80 +.set FPR_SAVE_17, 72 +.set FPR_SAVE_16, 64 +.set FPR_SAVE_15, 56 +.set FPR_SAVE_14, 48 + + +/* various offsets used by "qt_varg" */ +.set P_T, PAR_0 +.set P_STARTUP, PAR_1 +.set P_USERF, PAR_2 +.set P_CLEANUP, PAR_3 + /* the offset used to move back the linkage area to be adiacent to + * the variant argument list before calling "userf(...) */ +.set VARGS_BKOFF, 16 /* skip "t", "startup", "userf" and "cleanup" */ + + /* location where "t" and "cleanup" are saved (with respect of + * the stack frame base) */ +.set P_T_SAVE, -4 +.set P_CLEANUP_SAVE, -8 + +#endif + + + +/* Block the current thread saving all integer non volatile registers and + * start a new thread. + */ +#if 0 +.if 0 +#endif +void *qt_blocki (void *helper, void *a0, void *a1, void *newthread); +asm void *qt_blocki (void *helper, void *a0, void *a1, void *newthread) +{ +#if 0 +.endif +#endif + +#if 0 +qt_blocki: +_qt_blocki: +#endif +/* prolog code */ + stwu r1,-BLOCKI_FSIZE(r1) /* allocate the stack frame */ + mflr r0 /* return addr in r0 */ + mfcr r11 /* CR in r11 */ + stw r0,LR_SAVE+BLOCKI_FSIZE(r1) /* save return addr in the stack */ + stw r11,CR_SAVE+BLOCKI_FSIZE(r1) /* save CR in the stack */ + stmw r13,GPR_SAVE_13(r1) /* save non-volatile reg */ + +/* call helper(qt_t *old, void *a0, void *a1) */ + mtlr r3 /* "helper" addr in the link reg */ + mr r3,r1 /* current thread (i.e. the SP) in arg "old" */ + mr r1,r6 /* swap to the new thread (i.e. to its SP) */ + blrl /* jump to "helper" */ +/* the "helper" return value is returned (since r3 is not changed) */ + +/* epilog code: return to the new thread's "qt_blocki" caller */ + lmw r13,GPR_SAVE_13(r1) /* restore non-volatile reg */ + lwz r0,LR_SAVE+BLOCKI_FSIZE(r1) /* recover return addr */ + lwz r11,CR_SAVE+BLOCKI_FSIZE(r1) /* recover CR */ + mtlr r0 /* return address in the link reg */ + mtcr r11 /* restore CR */ + addi r1,r1,BLOCKI_FSIZE /* free the stack frame */ + blr /* return */ + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +/* Abort the current thread and start a new thread. + */ +#if 0 +.if 0 +#endif +void qt_abort (void *helper, void *a0, void *a1, void *newthread); +asm void qt_abort (void *helper, void *a0, void *a1, void *newthread) +{ +#if 0 +.endif +#endif + +#if 0 +qt_abort: +_qt_abort: +#endif +/* prolog code */ +/* there is no prolog. It will never come back */ + +/* call helper(qt_t *old, void *a0, void *a1) */ + mtlr r3 /* "helper" addr in the link reg */ + mr r1,r6 /* swap to the new thread (i.e. to its SP) */ +/* we don't need to set "old", we can pass just garbage. Actually, since r3 + is not changed, "old" is set to "helper" (don't care) */ + blrl /* call "helper" */ +/* the "helper" return value is returned (since r3 is not changed) */ + +/* epilog code: return to the new thread's "qt_blocki" caller */ + lmw r13,GPR_SAVE_13(r1) /* restore non-volatile reg */ + lwz r0,LR_SAVE+BLOCKI_FSIZE(r1) /* recover return addr */ + lwz r11,CR_SAVE+BLOCKI_FSIZE(r1) /* recover CR */ + mtlr r0 /* return address in the link reg */ + mtcr r11 /* restore CR */ + addi r1,r1,BLOCKI_FSIZE /* free the stack frame */ + blr /* return */ + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +/* Block the current thread saving all non volatile registers and start + * a new thread. + */ +#if 0 +.if 0 +#endif +void *qt_block (void *helper, void *a0, void *a1, void *newthread); +asm void *qt_block (void *helper, void *a0, void *a1, void *newthread) +{ +#if 0 +.endif +#endif + +# if 0 +qt_block: +_qt_block: +#endif +/* prolog code */ + stwu r1,-BLOCK_FSIZE(r1) /* allocate the stack frame */ + mflr r0 /* return addr in r0 */ + stw r0,LR_SAVE+BLOCK_FSIZE(r1) /* save return addr in the stack */ + +/* save non-volatile fp reg */ + stfd f31,FPR_SAVE_31(r1) + stfd f30,FPR_SAVE_30(r1) + stfd f29,FPR_SAVE_29(r1) + stfd f28,FPR_SAVE_28(r1) + stfd f27,FPR_SAVE_27(r1) + stfd f26,FPR_SAVE_26(r1) + stfd f25,FPR_SAVE_25(r1) + stfd f24,FPR_SAVE_24(r1) + stfd f23,FPR_SAVE_23(r1) + stfd f22,FPR_SAVE_22(r1) + stfd f21,FPR_SAVE_21(r1) + stfd f20,FPR_SAVE_20(r1) + stfd f19,FPR_SAVE_19(r1) + stfd f18,FPR_SAVE_18(r1) + stfd f17,FPR_SAVE_17(r1) + stfd f16,FPR_SAVE_16(r1) + stfd f15,FPR_SAVE_15(r1) + stfd f14,FPR_SAVE_14(r1) +/* block the thread */ + bl qt_blocki +/* the thread is going to be resumed */ +/* restore non-volatile fp reg */ + lfd f31,FPR_SAVE_31(r1) + lfd f30,FPR_SAVE_30(r1) + lfd f29,FPR_SAVE_29(r1) + lfd f28,FPR_SAVE_28(r1) + lfd f27,FPR_SAVE_27(r1) + lfd f26,FPR_SAVE_26(r1) + lfd f25,FPR_SAVE_25(r1) + lfd f24,FPR_SAVE_24(r1) + lfd f23,FPR_SAVE_23(r1) + lfd f22,FPR_SAVE_22(r1) + lfd f21,FPR_SAVE_21(r1) + lfd f20,FPR_SAVE_20(r1) + lfd f19,FPR_SAVE_19(r1) + lfd f18,FPR_SAVE_18(r1) + lfd f17,FPR_SAVE_17(r1) + lfd f16,FPR_SAVE_16(r1) + lfd f15,FPR_SAVE_15(r1) + lfd f14,FPR_SAVE_14(r1) + + lwz r0,LR_SAVE+BLOCK_FSIZE(r1) /* recover return addr */ + mtlr r0 /* return address in the link reg */ + addi r1,r1,BLOCK_FSIZE /* free the stack frame */ + blr /* return */ + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +/* Start a single argument thread using parameters preloaded in the stack + * during thread initialization (see comments on stack initialization in the + * heather file). + * + * Executes: + * + * only(u, t, userf); + */ +#if 0 +.if 0 +#endif +void qt_start(void); +asm void qt_start(void) +{ +#if 0 +.endif +#endif + +#if 0 +qt_start: +_qt_start: +#endif + lwz r3,PAR_0(r1) /* "u" in r3 */ + lwz r4,PAR_1(r1) /* "t" in r4 */ + lwz r5,PAR_2(r1) /* "userf" in r5 */ + lwz r6,PAR_3(r1) /* "only" in r6 */ + mtlr r6 /* "only" address in the link reg */ +/* call only(u, t, userf) */ + blrl /* jump to "only" */ +/* error if it returns */ + b _qt_error +/* dead code (some inline asm "wants" the epilog, or they genetare it) */ + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +/* Start a variant argument thread using parameters preloaded in the stack + * during thread initialization (see comments on stack initialization in the + * heather file). + * + * Executes: + * + * startup(t); + * userf_return = userf(...); + * cleanup(pt, userf_return); + * + + + ***** Stack layout on start ***** + + + backchain -> STACK BOTTOM (higher address) + +==========================+ + backchain - 4 -> | | + + LOCAL VARIABLES AREA + + .............. + + + + | | + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | arg(n) + + + + | | + + VARIABLE ARGUMENT LIST + + .............. + + for userf call + + SP + PAR(5) -> | | arg(1) + + + + SP + PAR(4) -> | | arg(0) + +--------------------------+ + SP + PAR(3) -> | | cleanup par + + + + SP + PAR(2) -> | | userf par + + PARAMETER AREA + + SP + PAR(1) -> | | startup par + + + + SP + PAR(0) -> | | t par + +--------------------------+ + | | + + LINKAGE AREA + + SP -> | | + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + + + + ***** Stack layout before call userf ***** + + + backchain -> STACK BOTTOM (higher address) + +==========================+ + backchain - 4 -> | | + + LOCAL VARIABLES AREA + + .............. + + + + | | + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | arg(n) + + + + | | + + VARIABLE ARGUMENT LIST + + .............. + + for userf call + + SP + PAR(1) -> | | arg(1) + + + + SP + PAR(0) -> | | arg(0) + +--------------------------+ + | | + + LINKAGE AREA + + SP -> | | + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + + + * To call "userf(...)", the argument list must be adiacent to the linkage + * area. Instead of copy the argument list, we move back the linkage area + * (actually, we just increase the SP and copy the backchain). "t" and + * "cleanup" are saved in a local variable area in order to call + * cleanup(pt, userf_return). + +*/ + + +#if 0 +.if 0 +#endif +void qt_vstart(void); +asm void qt_vstart(void) +{ +#if 0 +.endif +#endif + +#if 0 +qt_vstart: +_qt_vstart: +#endif +/* NOTICE: the callee routines could save parameter registers in the caller's + * stack parameter area. We put "t" in PAR(0) in such a way, if startup(t) + * will save "t", it will be saved on the same location thus not delething + * any other parameter. + */ + +/* since we will move back the linckage area (to make it adiacent to the + * parameter list), we need to save "t" and "cleanup". We have made room for + * this on the bottom of the stack frame. */ + +/* save parameters in the local variable area */ + lwz r11,0(r1) /* get the backchain */ + lwz r3,P_T(r1) + lwz r4,P_CLEANUP(r1) + stw r3,P_T_SAVE(r11) /* save "pt" */ + stw r4,P_CLEANUP_SAVE(r11) /* save "cleanup" */ + +/* call startup(t) */ + lwz r5,P_STARTUP(r1) + mtlr r5 + blrl /* call "startup" */ + +/* call userf(...) */ + lwz r11,0(r1) /* reload backchain (r11 is volatile) */ + lwz r4,P_USERF(r1) /* load "userf" */ + mtlr r4 + + /* first eight parameter of the variant list must be copyed in + * GPR3-GPR10. There is a four places offset due to "t", "startup", + * userf" and "cleanup" */ + + lwz r3,PAR_4(r1) + lwz r4,PAR_5(r1) + lwz r5,PAR_6(r1) + lwz r6,PAR_7(r1) + lwz r7,PAR_8(r1) + lwz r8,PAR_9(r1) + lwz r9,PAR_10(r1) + lwz r10,PAR_11(r1) + + + /* move the linkage area to be adiacent to the argument list */ + stw r11,VARGS_BKOFF(r1) /* copy backchain */ + addi r1,r1,VARGS_BKOFF /* move back the stack */ + + blrl /* call "userf" */ + +/* call qt_cleanup(void *pt, void *vuserf_return) */ + lwz r11,0(r1) /* reload backchain (r11 is volatile) */ + + mr r4,r3 /* push "userf" return as 2nd parameter */ + lwz r3,P_T_SAVE(r11) /* reload "pt" */ + lwz r5,P_CLEANUP_SAVE(r11) /* reload "cleanup" */ + mtlr r5 + blrl + b _qt_error +/* dead code (some inline asm "wanst" the epilog, or they genetare it) */ + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + diff --git a/ext/systemc/src/sysc/qt/md/powerpc_mach_b.s b/ext/systemc/src/sysc/qt/md/powerpc_mach_b.s new file mode 100644 index 000000000..f0fd23fcb --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/powerpc_mach_b.s @@ -0,0 +1,290 @@ +/* speed test for basic CPU operations */ + + +/* Marco Bucci <marco.bucci@inwind.it> */ + +/* This code was developed with the Code Warrior integrate ppc assembler. + * Macros are use to hide illegal constructs whether you are using a + * "normal" assembler or the "C integrated" assembler. + */ + +#if 0 + + + .text + .align 4 + + .globl b_call_reg + .globl _b_call_reg + .globl b_call_imm + .globl _b_call_imm + .globl b_add + .globl _b_add + .globl b_load + .globl _b_load + +.set fsize, 64 +.set lrsave, 8 + +#else + +#define fsize 64 +#define lrsave 8 + +#endif + + + + +#if 0 +.if 0 +#endif +asm void b_null(void) +{ +#if 0 +.endif +#endif + +#if 0 +b_null: +#endif + + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + +/* actually the same as the following. How to get "b_null" address? + * I didnt find the right sintax or the right way. + * I should take the current PC, then the difference to "b_null" + * (making the difference beween the labels), perform the sum and go?! + */ +#if 0 +.if 0 +#endif +asm void b_call_reg(long n) +{ +#if 0 +.endif +#endif + +#if 0 +b_call_reg: +_b_call_reg: +#endif + + mflr r0 + stw r31,-4(r1) + stw r30,-8(r1) + stw r0,lrsave(r1) + stwu r1,-fsize(r1) + mr r30,r3 + li r31,0 + + b L1 +L0: + bl b_null + bl b_null + bl b_null + bl b_null + bl b_null + + addi r31,r31,5 +L1: + cmpw r31,r30 + blt L0 + + + lwz r0,lrsave+fsize(r1) + mtlr r0 + lwz r31,-4+fsize(r1) + lwz r30,-8+fsize(r1) + addi r1,r1,fsize + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + + +#if 0 +.if 0 +#endif +asm void b_call_imm(long n) +{ +#if 0 +.endif +#endif + +#if 0 +b_call_imm: +_b_call_imm: +#endif + + mflr r0 + stw r31,-4(r1) + stw r30,-8(r1) + stw r0,lrsave(r1) + stwu r1,-fsize(r1) + mr r30,r3 + li r31,0 + + b L3 +L2: + bl b_null + bl b_null + bl b_null + bl b_null + bl b_null + + addi r31,r31,5 +L3: + cmpw r31,r30 + blt L2 + + + lwz r0,lrsave+fsize(r1) + mtlr r0 + lwz r31,-4+fsize(r1) + lwz r30,-8+fsize(r1) + addi r1,r1,fsize + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +#if 0 +.if 0 +#endif +asm void b_add(long n) +{ +#if 0 +.endif +#endif + +#if 0 +b_add: +_b_add: +#endif + + mflr r0 + stw r31,-4(r1) + stw r30,-8(r1) + stw r0,lrsave(r1) + stwu r1,-fsize(r1) + mr r30,r3 + li r31,0 + + b L5 +L4: + addi r3,r3,5 + addi r4,r4,5 + addi r5,r5,5 + addi r6,r6,5 + addi r7,r7,5 + + addi r3,r3,5 + addi r4,r4,5 + addi r5,r5,5 + addi r6,r6,5 + addi r7,r7,5 + + addi r31,r31,10 +L5: + cmpw r31,r30 + blt L4 + + + lwz r0,lrsave+fsize(r1) + mtlr r0 + lwz r31,-4+fsize(r1) + lwz r30,-8+fsize(r1) + addi r1,r1,fsize + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +#if 0 +.if 0 +#endif +asm void b_load(long n) +{ +#if 0 +.endif +#endif + +#if 0 +b_load: +_b_load: +#endif + + mflr r0 + stw r31,-4(r1) + stw r30,-8(r1) + stw r0,lrsave(r1) + stwu r1,-fsize(r1) + mr r30,r3 + li r31,0 + + b L7 +L6: + lwz r3,4(r1) + lwz r4,8(r1) + lwz r5,12(r1) + lwz r6,16(r1) + lwz r7,20(r1) + + lwz r3,24(r1) + lwz r4,28(r1) + lwz r5,32(r1) + lwz r6,36(r1) + lwz r7,40(r1) + + + addi r31,r31,10 +L7: + cmpw r31,r30 + blt L6 + + + lwz r0,lrsave+fsize(r1) + mtlr r0 + lwz r31,-4+fsize(r1) + lwz r30,-8+fsize(r1) + addi r1,r1,fsize + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif diff --git a/ext/systemc/src/sysc/qt/md/powerpc_sys5.h b/ext/systemc/src/sysc/qt/md/powerpc_sys5.h new file mode 100644 index 000000000..8c0730704 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/powerpc_sys5.h @@ -0,0 +1,566 @@ +/* + + * QuickThreads -- Threads-building toolkit. + + * Copyright (c) 1993 by David Keppel + + * + + * Permission to use, copy, modify and distribute this software and + + * its documentation for any purpose and without fee is hereby + + * granted, provided that the above copyright notice and this notice + + * appear in all copies. This software is provided as a + + * proof-of-concept and for demonstration purposes; there is no + + * representation about the suitability of this software for any + + * purpose. + + * + + + * PowerPC-Sys5 thread switching module. + + * + + * This software is largely based on the original PowerPC-Linux porting + + * developed by Ken Aaker <kenaaker@silverbacksystems.com> + + * + + * Marco Bucci <marco.bucci@inwind.it> + + * December 2002 + + * + + */ + + +#ifndef QUICKTHREADS_POWERPC_H +#define QUICKTHREADS_POWERPC_H + + +/***************************************************************************** + * + * DESCRIPTION + * + * This is the QuickThreads switching module implementation for PowerPC + * running under System V ABI (Application Binary Interface) [2]. It was + * developed by porting the MacOS X version and tested under LinuxPPC. + * + * Notice that this is not the same than the PowerPC Mach ABI used by MacOSX + * [1]. + * + * IMPLEMENTATION NOTES + * + * 1) Porting on System V ABI + * Excluding the variant argument calling convention, Mach and System V ABI + * are enough similar and it could be possible to use some simple macro, to + * adapt the code for both the ABIs. Actually, the only relevant difference + * is in the linkage area structure and in the position where the Link and + * the Condition registers are saved. As to the calling conventions, there + * are differences with floating points argument passing and with variant + * argument lists. Notice that, on Mach, the caller's stack frame allocates + * space to hold all arguments ([1] p.51), while on System V, the caller's + * stack frame allocates space to hold just the arguments that don't fit into + * registers ([2] p.3.18). + * + * 2) Variant argument list implementation + * Variant argument calling on a RISC machine is not easy to implement since + * parameters are passed via registers instead of via stack. In a general + * variant argument implementation, the caller's stack must map the whole + * parameter list following the rules related to the use of the GPR and FPR + * parameter registers and the stack alignment ([2] p.3-21). + * This implementation is quite simple and not general. It works under the + * hypothesis that arguments are 4-bytes aligned integers. + * + * 3) This heather file organisation + * I preferred to not make confusion between macros that are needed (i.e. + * directly used) by QuickThreads and internal "implementation" macros. You + * will find QuickThreds macros in the end of this header. Sometime they just + * refer to an analogous "internal" macro. On the top, there are the macros + * that I used to make more clean (I hope) the implementation. I could include + * some system heather (as to stack layout definitions, prologs and epilogs, + * etc.), but I preferred to have a self-contained heather in order to make + * all more clear for mantaining and for possible porting on another ABI. + * + * + * REFERENCES + * + * [1] - Mach-O Runtime Architecture + * Runtime Concepts and Conventions for Mac OS X Programs + * Preliminary July 2002 + * + * [2] - SYSTEM V APPLICATION BINARY INTERFACE + * PowerPC Processor Supplement + * September 1995 + * + + *****************************************************************************/ + +/***************************************************************************** + * + * PowerPC System V Stack frame (see [2]) + * + + ................ + + + + | | + +--------------------------+ + | | Caller's LR + + CALLER'S LINKAGE AREA + + backchain -> | | Caller's backchain + +==========================+ + | | FPR31 + + FPR SAVE AREA + + .............. + + + + | | FPRn + +--------------------------+ + | | GPR31 + + GPR SAVE AREA + + .............. + + + + | | GPRn + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | CR SAVE | + +--------------------------+ + | | + + LOCAL VARIABLES AREA + + .............. + + + + | | + +--------------------------+ + | | PAR(n-7) + + + + | | + + PARAMETER AREA + + .............. + + for FUTURE call + + | | PAR(9) + + + + SP + 8 -> | | PAR(8) + +--------------------------+ + SP + 4 -> | | LR callee-save for FUTURE call + + LINKAGE AREA + + SP -> | | backchain + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + + + * NOTE: + * + * 1) In this figure parameter are supposed to be integer 4-bytes aligned and + * are numbered 0, 1, 2,... n. + * + * 2) Parameter are allocated in the CALLER's parameter area. This area must + * be large enough to hold all parameters that cannot fit in registers (no + * more parameter registers are available); + * + * 3) The callee saves LR in the caller's linkage area. CR as all other + * callee's state are saved in its own stack frame. + * + + *****************************************************************************/ + + +/***************************************************************************** + * + * Stack initialization for a single argument thread + * + + + top + QUICKTHREADS_STKBASE -> STACK BOTTOM (higher address) + +==========================+ + | | + + + + .............. + + + + | | + +--------------------------+ + top + QUICKTHREADS_ONLY_INDEX * 4 -> | only param | PAR(3) + + + + top + QUICKTHREADS_USER_INDEX * 4 -> | userf param | PAR(2) + + + + top + QUICKTHREADS_ARGT_INDEX * 4 -> | t param | PAR(1) + + + + top + QUICKTHREADS_ARGU_INDEX * 4 -> | u param | PAR(0) + +--------------------------+ + top + QUICKTHREADS_RETURN_INDEX * 4 -> | qt_start | LR save + + + + top + QUICKTHREADS_BLOCKI_FRAME_SIZE -> | top + QUICKTHREADS_STKBASE | backchain + +==========================+ + | | + + + + .............. + + + + | | + +--------------------------+ + | | + + + + top -> |top + QUICKTHREADS_BLOCKI_FRAME_SIZE| backchain + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + + ***************************************************************************** + * + * Stack initialization for a variant argument thread + * + + bottom -> STACK BOTTOM (higher address) + +==========================+ + | | + + + + .............. + + + + top + QUICKTHREADS_VSTKBASE -> | arg(0) | PAR(4) + +--------------------------+ + top + QUICKTHREADS_CLEANUP_INDEX * 4 -> | cleanup param | PAR(3) + + + + top + QUICKTHREADS_USER_INDEX * 4 -> | userf param | PAR(2) + + + + top + QUICKTHREADS_VSTARTUP_INDEX * 4 ->| startup param | PAR(1) + + + + top + QUICKTHREADS_ARGT_INDEX * 4 -> | t param | PAR(0) + +--------------------------+ + top + QUICKTHREADS_RETURN_INDEX * 4 -> | qt_start | LR save + + + + top + QUICKTHREADS_BLOCKI_FRAME_SIZE -> | top + QUICKTHREADS_STKBASE | backchain + +==========================+ + | | + + + + .............. + + + + | | + +--------------------------+ + | | + + + + top -> |top + QUICKTHREADS_BLOCKI_FRAME_SIZE| backchain + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + +* NOTE: +* +* Parameters are passed to "qt_start" or to "qt_vstart" putting them into +* the stack frames of "qt_start" or "qt_vstart" themselves. This not a +* conventional parameter passing because parameters should be put into the +* caller's stack, not into the callee's one. Actually we must consider +* that as a preload of the parameter area that "qt_start" or "qt_vstart" +* will use for their own calls. +* Be aware of the fact that, during a call, the caller's parameter area is, +* in a certain sense, volatile. In facts, the callee can save parameter +* registers on the caller's parameter area. +* + *****************************************************************************/ + + +/***************************************************************************** + + Define PowerPC System V related macros + + *****************************************************************************/ + + + +typedef unsigned long PPC_W; + +/* Stack pointer must always be a multiple of 16 */ +#define PPC_STACK_INCR 16 +#define PPC_ROUND_STACK(length) \ + (((length)+PPC_STACK_INCR-1) & ~(PPC_STACK_INCR-1)) + + +#define PPC_LINKAGE_AREA 8 +#define PPC_LR_SAVE 4 + +#define PPC_PARAM_AREA(n) (4*(n)) + +#define PPC_GPR_SAVE_AREA (4*19) /* GPR13-GPR31 must be saved */ +#define PPC_FPR_SAVE_AREA (8*18) /* FPR14-FPR31 must be saved */ + +/* Define parameter offset on the stack. + * NOTICE: Parameters are numbered 0, 1, ..., n. +*/ +#define PPC_PAR(i) (PPC_LINKAGE_AREA+(i)*4) + +/***************************************************************************** + + Define stack frames + + *****************************************************************************/ + + +/* Define the "qt_blocki" and "qt_abort" stack frame. We use the same stack + * frame for both. + * + + top + S -> + +==========================+ + top + S - 4 -> | | GPR31 + + GPR SAVE AREA + + .............. + + + + top + S - 19 * 4 -> | | GPR13 + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + top + 8 -> | CR SAVE | + +--------------------------+ + | | + + LINKAGE AREA + + top -> | | + +==========================+ + */ + +#define QUICKTHREADS_BLOCKI_FRAME_SIZE \ + PPC_ROUND_STACK(PPC_LINKAGE_AREA+4+PPC_GPR_SAVE_AREA) + +#define QUICKTHREADS_BLOCKI_CR_SAVE 8 + +/* Offset to the base of the GPR save area. Save from GPR13 to GPR31 + * increasing address. + */ +#define QUICKTHREADS_BLOCKI_GPR_SAVE(i) (QUICKTHREADS_BLOCKI_FRAME_SIZE-4+(i-31)*4) + + + +/* Define the "qt_block" stack frame. Notice that since "qt_black" calls + * "qt_blocki", GPR registers are saved into "qt_blocki" stack frame. + * + + top + S -> + +==========================+ + top + S - 8 -> | | FPR31 + + FPR SAVE AREA + + .............. + + + + top + S - 18 * 8 -> | | FPR14 + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | + + LINKAGE AREA + + top -> | | + +==========================+ + */ + +#define QUICKTHREADS_BLOCK_FRAME_SIZE \ + PPC_ROUND_STACK(PPC_LINKAGE_AREA+PPC_FPR_SAVE_AREA) + +/* Offset to the location where registers are saved. + */ +#define QUICKTHREADS_BLOCK_FPR_SAVE(i) (QUICKTHREADS_BLOCK_FRAME_SIZE-8+(i-31)*8) + + +/* Define the "qt_start" frame size. It consists just of the linkage area and + * the parameter area. + * + + +==========================+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | only par + + + + | | userf par + + PARAMETER AREA + + | | t par + + + + top + 8 -> | | u par + +--------------------------+ + | | + + LINKAGE AREA + + top -> | | + +==========================+ + + */ +#define QUICKTHREADS_START_FRAME_SIZE PPC_ROUND_STACK(PPC_LINKAGE_AREA+PPC_PARAM_AREA(4)) + + + +/* Define the "qt_vstart" frame. It consists of the linkage area, the fix parameter + * area, the variant argument list and a local variable area used in "qt_vstart" + * implementation. + * + + backchain -> + +==========================+ + backchain - 4 -> | | + + LOCAL VARIABLES AREA + + .............. + + + + | | + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | arg(n) + + + + | | + + VARIABLE ARGUMENT LIST + + .............. + + for userf call + + | | arg(1) + + + + top + 8 + 16 -> | | arg(0) + +--------------------------+ + | | cleanup par + + + + | | userf par + + PARAMETER AREA + + | | startup par + + + + top + 8 -> | | t par + +--------------------------+ + | | + + LINKAGE AREA + + top -> | | + +==========================+ + + */ +#define QUICKTHREADS_VARGS_LOCAL_AREA (4*4) /* local variable area */ + +/* The offset the stack will be moved back before to call "userf(...)". + * The linckage area must be moved to be adiacent to the part of the variant + * argument list that is in the stack. Notice that, since the first 8 + * parameters are passed via registers, the offset is equal to the size of + * 4+8 parameters. */ +#define QUICKTHREADS_VARGS_BKOFF PPC_PARAM_AREA(4+8) + +#define QUICKTHREADS_VSTART_FRAME_SIZE(varbytes) \ + PPC_ROUND_STACK(PPC_LINKAGE_AREA+QUICKTHREADS_VARGS_BKOFF+(varbytes)+ \ + QUICKTHREADS_VARGS_LOCAL_AREA) + +/* Offset to the base of the varian argument list */ +#define QUICKTHREADS_VSTART_LIST_BASE (PPC_LINKAGE_AREA+PPC_PARAM_AREA(4)) + + +/* Notice that qt_start and qt_vstart have no parameters, actually their + * parameters are written in their stack frame during thread initialization + */ +extern void qt_start(void); +extern void qt_vstart(void); + + + +/* Offset (in words) of the location where the block routine saves its return + * address (i.e. LR). SP points the top of the block routine stack and, + * following ppc calling conventions, the return address is saved in the + * previous (caller's) stack frame. + */ +#define QUICKTHREADS_RETURN_INDEX ((QUICKTHREADS_BLOCKI_FRAME_SIZE+PPC_LR_SAVE)/sizeof(PPC_W)) + +/* static variable used to get the stack bottom in "VARGS" initialization */ +static void *qt_sp_bottom_save; + +#define QUICKTHREADS_ARG_INDEX(i) ((QUICKTHREADS_BLOCKI_FRAME_SIZE+PPC_PAR(i))/sizeof(PPC_W)) + +/***************************************************************************** + + QuickThreads needed definitions + + *****************************************************************************/ + + +#define QUICKTHREADS_GROW_DOWN +#define QUICKTHREADS_STKALIGN PPC_STACK_INCR +typedef PPC_W qt_word_t; + + +/* This macro is used by "QUICKTHREADS_ARGS" to initialize a single argument thread. + * - set "qt_start" as the "qt_block" or "qt_blocki" return address; + * - set the top of the stack backchain; + * - set the next backchain (not needed, but just to be "clean"). + */ +#define QUICKTHREADS_ARGS_MD(sp) \ + (QUICKTHREADS_SPUT (sp, QUICKTHREADS_RETURN_INDEX, qt_start), \ + QUICKTHREADS_SPUT (sp, 0, sp+QUICKTHREADS_BLOCKI_FRAME_SIZE), \ + QUICKTHREADS_SPUT (sp, QUICKTHREADS_BLOCKI_FRAME_SIZE/sizeof(PPC_W), \ + sp+QUICKTHREADS_BLOCKI_FRAME_SIZE+QUICKTHREADS_START_FRAME_SIZE)) + + +/* This macro is used by "QUICKTHREADS_VARGS" to initialize a variant argument thread. + * It returns the pointer to the top of the argument list. + * We also use it to get the stack bottom via a static variable. This is a bit + * "dirty", it could be better to do it in "qt_vargs", but we don't want change + * anything out of this file. + * We need the stack bottom to allocate a local variable area used by + * "qt_vstart". + */ +#define QUICKTHREADS_VARGS_MD0(sp, varbytes) \ + ((qt_sp_bottom_save = sp), \ + ((qt_t *)(((char *)(sp)) - \ + (QUICKTHREADS_VSTART_FRAME_SIZE(varbytes)-QUICKTHREADS_VSTART_LIST_BASE)))) + + +/* This macro is used by "QUICKTHREADS_VARGS" to initialize a variant argument thread. + * - set "qt_start" as the "qt_block" or "qt_blocki" return address; + * - set the top of the stackback chain; + * - set the next backchain (it points the stack botton). + */ +#define QUICKTHREADS_VARGS_MD1(sp) \ + (QUICKTHREADS_SPUT (sp, QUICKTHREADS_RETURN_INDEX, qt_vstart), \ + QUICKTHREADS_SPUT (sp, 0, sp+QUICKTHREADS_BLOCKI_FRAME_SIZE), \ + QUICKTHREADS_SPUT (sp, (QUICKTHREADS_BLOCKI_FRAME_SIZE)/sizeof(PPC_W), \ + qt_sp_bottom_save)) + + +/* Activate "qt_vargs" as the initialization routine for the variant + * argument threads + */ +#define QUICKTHREADS_VARGS_DEFAULT + +/* Override "qt_vargs" with "qt_vargs_stdarg". + * On LinuxPPC "qt_vargs" doesn't work, "qt_vargs_stdarg" uses a more + * standard way to retrieve arguments from the variant list. + */ +#define QUICKTHREADS_VARGS(sp, nbytes, vargs, pt, startup, vuserf, cleanup) \ + ((qt_t *)qt_vargs_stdarg (sp, nbytes, vargs, pt, startup, vuserf, cleanup)) + + +/* This macro is used by "QUICKTHREADS_ADJ(sp)" to get the stack top form the stack + * bottom during a single argument thread initialization. + * It is the space we need to allocate for a single argument thread: the stack + * frame for the block routine ("qt_block" or "qt_blocki") and for "qt_start". + */ +#define QUICKTHREADS_STKBASE \ + (QUICKTHREADS_BLOCKI_FRAME_SIZE+QUICKTHREADS_START_FRAME_SIZE) + +/* This macro is used by "QUICKTHREADS_VADJ(sp)" to get the stack top from the base + * of the variant argument list during a variant argument thread initialization. + */ +#define QUICKTHREADS_VSTKBASE (QUICKTHREADS_BLOCKI_FRAME_SIZE+QUICKTHREADS_VSTART_LIST_BASE) + +/* The *index* (positive offset) of where to put each value. */ + +#define QUICKTHREADS_ARGU_INDEX QUICKTHREADS_ARG_INDEX(0) +#define QUICKTHREADS_ARGT_INDEX QUICKTHREADS_ARG_INDEX(1) +#define QUICKTHREADS_USER_INDEX QUICKTHREADS_ARG_INDEX(2) +#define QUICKTHREADS_ONLY_INDEX QUICKTHREADS_ARG_INDEX(3) + + +#define QUICKTHREADS_VARGT_INDEX QUICKTHREADS_ARG_INDEX(0) +#define QUICKTHREADS_VSTARTUP_INDEX QUICKTHREADS_ARG_INDEX(1) +#define QUICKTHREADS_VUSERF_INDEX QUICKTHREADS_ARG_INDEX(2) +#define QUICKTHREADS_VCLEANUP_INDEX QUICKTHREADS_ARG_INDEX(3) + +#endif /* ndef QUICKTHREADS_POWERPC_H */ + diff --git a/ext/systemc/src/sysc/qt/md/powerpc_sys5.s b/ext/systemc/src/sysc/qt/md/powerpc_sys5.s new file mode 100644 index 000000000..d9dc9332d --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/powerpc_sys5.s @@ -0,0 +1,639 @@ +/* powerpc-sys5.s -- assembly support. */ + +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + + + * PowerPC-System V thread switching module. + * + * This software is largely based on the original PowerPC-Linux porting + * developed by Ken Aaker <kenaaker@silverbacksystems.com> + * + * Marco Bucci <marco.bucci@inwind.it> + * December 2002 + * + */ + + +/* + * + * PowerPC Register convections: + * + * r0 volatile + * r1 SP + * r2 system reserved + * r3-r4 volatile for parameter passing and function return + * r5-r10 volatile for parameter passing + * r11-r12 volatile + * r13-r14 non volatile registers + * f0 volatile + * f1 volatile for parameter passing and function return + * f2-f13 volatile for parameter passing + * f14-f31 non volatile + * + * cr2-cr4 non volatile + * + * + * See on the heather file for more documentation. + * + * + * + * IMPLEMENTATION NOTES + * + * + * 1) Condition register saving + * On most machines, the condition code register is caller-save. + * On the PPC, the condition code register is callee-save, so the + * thread context switch must preserve it. + * + * + * 2) Floating point registers saving + * On resuming a thread, floating point registers are or not restored just + * depending on which block routine suspended the thread (i.e. regardless + * whether "qt_block", "qt_blocki" or "qt_abort" is used to resume it). + * This behaviour is obtained by implementing "qt_block" by means af a nested + * call to "qt_blocki". As a result, the blocking of a thread always goes + * and returns through "qt_blocki and, if a thread was blocked by "qt_block", + * its execution resumes from the floating point restoring code on exit + * of "qt_block". + * + * Thanks to David Keppel that explained me this "simple" trick. + * + * + * 3) C languace code debugging + * The original version of this software was developed and debugged under + * MacOS X using the Metrowerks Code Warrior PPC integrated assembler. + * It could be still used with a C inline assembler by means of a suitable + * file to include it. + * In order to avoid "copy and paste" bugs, and make easyer the maintaining, + * I made the minimal changes, so you can find some strange code as: + * + * #if 0 + * .if 0 + * C code here + * .endif + * #endif + * + * This is just to embed some C code that is needed by the Code Warrior + * integrated assembler. + * + * + * 4) Assembly constants generation + * Constants used in the assembly code are generated by running + * the C code in the sequel (commented). It uses the C macros declared in + * the C heather in order to guarantee that the C interface and the assebly + * code are "aligned". I avoided the use of an assebler preprocessor since + * they are not so standard and moreover using macro espressions makes the + * assembly debugging more difficult. + * + * + + +#include <iostream> +#include "powerpc_sys5.h" + +int main() +{ + using namespace std; + + int i; + + cout << ".set LR_SAVE, " << PPC_LR_SAVE << endl; + cout << ".set BLOCKI_FSIZE, " << QUICKTHREADS_BLOCKI_FRAME_SIZE << endl; + cout << ".set BLOCKI_CR_SAVE, " << QUICKTHREADS_BLOCKI_CR_SAVE << endl; + cout << ".set BLOCK_FSIZE, " << QUICKTHREADS_BLOCK_FRAME_SIZE << endl; + + cout << endl; + for(i=0; i<12; i++) + cout << ".set PAR_" << i << ", " << PPC_PAR(i) << endl; + + cout << endl; + i = 13; + cout << ".set GPR_SAVE_" << i << ", " << QUICKTHREADS_BLOCKI_GPR_SAVE(i) << endl; + + cout << endl; + for(i=31; i>13; i--) + cout << ".set FPR_SAVE_" << i << ", " << QUICKTHREADS_BLOCK_FPR_SAVE(i) << endl; + + cout << endl; + cout << ".set VARGS_BKOFF, " << QUICKTHREADS_VARGS_BKOFF << endl; + + + cout << endl << endl << endl; + + for(i=31; i>13; i--) + cout << "\tstfd\tf" << i << ",FPR_SAVE_" << i << "(%r1)" << endl; + + cout << endl; + for(i=31; i>13; i--) + cout << "\tlfd \tf" << i << ",FPR_SAVE_" << i << "(%r1)" << endl; + + cout << endl << endl << endl; + + + return 0; +} + + + + * + * + * + */ + + +#if 0 + + .text + .align 4 + + .globl qt_block + .globl _qt_block + .globl qt_blocki + .globl _qt_blocki + .globl qt_abort + .globl _qt_abort + .globl qt_start + .globl _qt_start + .globl qt_vstart + .globl _qt_vstart + + +.set LR_SAVE, 4 +.set BLOCKI_FSIZE, 96 +.set BLOCKI_CR_SAVE, 8 /* CR is saved into the callee's stack frame */ +.set BLOCK_FSIZE, 160 + +.set PAR_0, 8 +.set PAR_1, 12 +.set PAR_2, 16 +.set PAR_3, 20 +.set PAR_4, 24 +.set PAR_5, 28 +.set PAR_6, 32 +.set PAR_7, 36 +.set PAR_8, 40 +.set PAR_9, 44 +.set PAR_10, 48 +.set PAR_11, 52 + +.set GPR_SAVE_13, 20 + +.set FPR_SAVE_31, 152 +.set FPR_SAVE_30, 144 +.set FPR_SAVE_29, 136 +.set FPR_SAVE_28, 128 +.set FPR_SAVE_27, 120 +.set FPR_SAVE_26, 112 +.set FPR_SAVE_25, 104 +.set FPR_SAVE_24, 96 +.set FPR_SAVE_23, 88 +.set FPR_SAVE_22, 80 +.set FPR_SAVE_21, 72 +.set FPR_SAVE_20, 64 +.set FPR_SAVE_19, 56 +.set FPR_SAVE_18, 48 +.set FPR_SAVE_17, 40 +.set FPR_SAVE_16, 32 +.set FPR_SAVE_15, 24 +.set FPR_SAVE_14, 16 + + + + +/* various offsets used by "qt_varg" */ +.set P_T, PAR_0 +.set P_STARTUP, PAR_1 +.set P_USERF, PAR_2 +.set P_CLEANUP, PAR_3 + /* the offset used to move back the linkage area to be adiacent to + * the variant argument list before calling "userf(...). + * Skip "t", "startup", "userf", "cleanup" and first + * 8 parameters (since they are passed via registers) */ +.set VARGS_BKOFF, 48 + + /* location where "t" and "cleanup" are saved (with respect of + * the stack frame base) */ +.set P_T_SAVE, -4 +.set P_CLEANUP_SAVE, -8 + +#endif + + + +/* Block the current thread saving all integer non volatile registers and + * start a new thread. + */ +#if 0 +.if 0 +#endif +void *qt_blocki (void *helper, void *a0, void *a1, void *newthread); +asm void *qt_blocki (void *helper, void *a0, void *a1, void *newthread) +{ +#if 0 +.endif +#endif + +#if 0 +qt_blocki: +_qt_blocki: +#endif +/* prolog code */ + stwu %r1,-BLOCKI_FSIZE(%r1) /* allocate the stack frame */ + mflr %r0 /* return addr in r0 */ + mfcr %r11 /* CR in r11 */ + stw %r0,LR_SAVE+BLOCKI_FSIZE(%r1) /* save return addr in the stack */ + stw %r11,BLOCKI_CR_SAVE(%r1) /* save CR in the stack */ + stmw %r13,GPR_SAVE_13(%r1) /* save non-volatile reg */ + +/* call helper(qt_t *old, void *a0, void *a1) */ + mtlr %r3 /* "helper" addr in the link reg */ + mr %r3,%r1 /* current thread (i.e. the SP) in arg "old" */ + mr %r1,%r6 /* swap to the new thread (i.e. to its SP) */ + blrl /* jump to "helper" */ +/* the "helper" return value is returned (since r3 is not changed) */ + +/* epilog code: return to the new thread's "qt_blocki" caller */ + lmw %r13,GPR_SAVE_13(%r1) /* restore non-volatile reg */ + lwz %r0,LR_SAVE+BLOCKI_FSIZE(%r1) /* recover return addr */ + lwz %r11,BLOCKI_CR_SAVE(%r1) /* recover CR */ + mtlr %r0 /* return address in the link reg */ + mtcr %r11 /* restore CR */ + addi %r1,%r1,BLOCKI_FSIZE /* free the stack frame */ + blr /* return */ + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +/* Abort the current thread and start a new thread. + */ +#if 0 +.if 0 +#endif +void qt_abort (void *helper, void *a0, void *a1, void *newthread); +asm void qt_abort (void *helper, void *a0, void *a1, void *newthread) +{ +#if 0 +.endif +#endif + +#if 0 +qt_abort: +_qt_abort: +#endif +/* prolog code */ +/* there is no prolog. It will never come back */ + +/* call helper(qt_t *old, void *a0, void *a1) */ + mtlr %r3 /* "helper" addr in the link reg */ + mr %r1,%r6 /* swap to the new thread (i.e. to its SP) */ +/* we don't need to set "old", we can pass just garbage. Actually, since r3 + is not changed, "old" is set to "helper" (don't care) */ + blrl /* call "helper" */ +/* the "helper" return value is returned (since r3 is not changed) */ + +/* epilog code: return to the new thread's "qt_blocki" caller */ + lmw %r13,GPR_SAVE_13(%r1) /* restore non-volatile reg */ + lwz %r0,LR_SAVE+BLOCKI_FSIZE(%r1) /* recover return addr */ + lwz %r11,BLOCKI_CR_SAVE(%r1) /* recover CR */ + mtlr %r0 /* return address in the link reg */ + mtcr %r11 /* restore CR */ + addi %r1,%r1,BLOCKI_FSIZE /* free the stack frame */ + blr /* return */ + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +/* Block the current thread saving all non volatile registers and start + * a new thread. + */ +#if 0 +.if 0 +#endif +void *qt_block (void *helper, void *a0, void *a1, void *newthread); +asm void *qt_block (void *helper, void *a0, void *a1, void *newthread) +{ +#if 0 +.endif +#endif + +# if 0 +qt_block: +_qt_block: +#endif +/* prolog code */ + stwu %r1,-BLOCK_FSIZE(%r1) /* allocate the stack frame */ + mflr %r0 /* return addr in r0 */ + stw %r0,LR_SAVE+BLOCK_FSIZE(%r1) /* save return addr in the stack */ + +/* save non-volatile fp reg */ + stfd %f31,FPR_SAVE_31(%r1) + stfd %f30,FPR_SAVE_30(%r1) + stfd %f29,FPR_SAVE_29(%r1) + stfd %f28,FPR_SAVE_28(%r1) + stfd %f27,FPR_SAVE_27(%r1) + stfd %f26,FPR_SAVE_26(%r1) + stfd %f25,FPR_SAVE_25(%r1) + stfd %f24,FPR_SAVE_24(%r1) + stfd %f23,FPR_SAVE_23(%r1) + stfd %f22,FPR_SAVE_22(%r1) + stfd %f21,FPR_SAVE_21(%r1) + stfd %f20,FPR_SAVE_20(%r1) + stfd %f19,FPR_SAVE_19(%r1) + stfd %f18,FPR_SAVE_18(%r1) + stfd %f17,FPR_SAVE_17(%r1) + stfd %f16,FPR_SAVE_16(%r1) + stfd %f15,FPR_SAVE_15(%r1) + stfd %f14,FPR_SAVE_14(%r1) +/* block the thread */ + bl qt_blocki +/* the thread is going to be resumed */ +/* restore non-volatile fp reg */ + lfd %f31,FPR_SAVE_31(%r1) + lfd %f30,FPR_SAVE_30(%r1) + lfd %f29,FPR_SAVE_29(%r1) + lfd %f28,FPR_SAVE_28(%r1) + lfd %f27,FPR_SAVE_27(%r1) + lfd %f26,FPR_SAVE_26(%r1) + lfd %f25,FPR_SAVE_25(%r1) + lfd %f24,FPR_SAVE_24(%r1) + lfd %f23,FPR_SAVE_23(%r1) + lfd %f22,FPR_SAVE_22(%r1) + lfd %f21,FPR_SAVE_21(%r1) + lfd %f20,FPR_SAVE_20(%r1) + lfd %f19,FPR_SAVE_19(%r1) + lfd %f18,FPR_SAVE_18(%r1) + lfd %f17,FPR_SAVE_17(%r1) + lfd %f16,FPR_SAVE_16(%r1) + lfd %f15,FPR_SAVE_15(%r1) + lfd %f14,FPR_SAVE_14(%r1) + + lwz %r0,LR_SAVE+BLOCK_FSIZE(%r1) /* recover return addr */ + mtlr %r0 /* return address in the link reg */ + addi %r1,%r1,BLOCK_FSIZE /* free the stack frame */ + blr /* return */ + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +/* Start a single argument thread using parameters preloaded in the stack + * during thread initialization (see comments on stack initialization in the + * heather file). + * + * Executes: + * + * only(u, t, userf); + */ +#if 0 +.if 0 +#endif +void qt_start(void); +asm void qt_start(void) +{ +#if 0 +.endif +#endif + +#if 0 +qt_start: +_qt_start: +#endif + lwz %r3,PAR_0(%r1) /* "u" in r3 */ + lwz %r4,PAR_1(%r1) /* "t" in r4 */ + lwz %r5,PAR_2(%r1) /* "userf" in r5 */ + lwz %r6,PAR_3(%r1) /* "only" in r6 */ + mtlr %r6 /* "only" address in the link reg */ +/* call only(u, t, userf) */ + blrl /* jump to "only" */ +/* error if it returns */ + b qt_error +/* dead code (some inline asm "wants" the epilog, or they genetare it) */ + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +/* Start a variant argument thread using parameters preloaded in the stack + * during thread initialization (see comments on stack initialization in the + * heather file). + * + * Executes: + * + * startup(t); + * userf_return = userf(...); + * cleanup(pt, userf_return); + * + + + ***** Stack layout on start ***** + + + backchain -> STACK BOTTOM (higher address) + +==========================+ + backchain - 4 -> | | + + LOCAL VARIABLES AREA + + .............. + + + + | | + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | arg(n) + + + + | | + + VARIABLE ARGUMENT LIST + + .............. + + for userf call + + SP + PAR(5) -> | | arg(1) + + + + SP + PAR(4) -> | | arg(0) + +--------------------------+ + SP + PAR(3) -> | | cleanup par + + + + SP + PAR(2) -> | | userf par + + PARAMETER AREA + + SP + PAR(1) -> | | startup par + + + + SP + PAR(0) -> | | t par + +--------------------------+ + | | + + LINKAGE AREA + + SP -> | | + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + + + + ***** Stack layout before call userf ***** + + + backchain -> STACK BOTTOM (higher address) + +==========================+ + backchain - 4 -> | | + + LOCAL VARIABLES AREA + + .............. + + + + | | + +--------------------------+ + | | + + ALIGNMEBNT PAD + + .............. + + (if needed) + + | | + +--------------------------+ + | | arg(n) + + + + | | + + VARIABLE ARGUMENT LIST + + .............. + + for userf call + + SP + PAR(1) -> | | arg(1) + + + + SP + PAR(0) -> | | arg(0) + +--------------------------+ + | | + + LINKAGE AREA + + SP -> | | + +==========================+ + STACK TOP (lower address) + + Stack grows down + | + V + + + * To call "userf(...)", the argument list must be adiacent to the linkage + * area. Instead of copy the argument list, we move back the linkage area + * (actually, we just increase the SP and copy the backchain). "t" and + * "cleanup" are saved in a local variable area in order to call + * cleanup(pt, userf_return). + +*/ + + +#if 0 +.if 0 +#endif +void qt_vstart(void); +asm void qt_vstart(void) +{ +#if 0 +.endif +#endif + +#if 0 +qt_vstart: +_qt_vstart: +#endif +/* NOTICE: the callee routines could save parameter registers in the caller's + * stack parameter area. We put "t" in PAR(0) in such a way, if startup(t) + * will save "t", it will be saved on the same location thus not delething + * any other parameter. + */ + +/* since we will move back the linckage area (to make it adiacent to the + * parameter list), we need to save "t" and "cleanup". We have made room for + * this on the bottom of the stack frame. */ + +/* save parameters in the local variable area */ + lwz %r11,0(%r1) /* get the backchain */ + lwz %r3,P_T(%r1) + lwz %r4,P_CLEANUP(%r1) + stw %r3,P_T_SAVE(%r11) /* save "pt" */ + stw %r4,P_CLEANUP_SAVE(%r11) /* save "cleanup" */ + +/* call startup(t) */ + lwz %r5,P_STARTUP(%r1) + mtlr %r5 + blrl /* call "startup" */ + +/* call userf(...) */ + lwz %r11,0(%r1) /* reload backchain (r11 is volatile) */ + lwz %r4,P_USERF(%r1) /* load "userf" */ + mtlr %r4 + + /* first eight parameter of the variant list must be copyed in + * GPR3-GPR10. There is a four places offset due to "t", "startup", + * userf" and "cleanup" */ + + lwz %r3,PAR_4(%r1) + lwz %r4,PAR_5(%r1) + lwz %r5,PAR_6(%r1) + lwz %r6,PAR_7(%r1) + lwz %r7,PAR_8(%r1) + lwz %r8,PAR_9(%r1) + lwz %r9,PAR_10(%r1) + lwz %r10,PAR_11(%r1) + + + /* move the linkage area to be adiacent to the argument list */ + stw %r11,VARGS_BKOFF(%r1) /* copy backchain */ + addi %r1,%r1,VARGS_BKOFF /* move back the stack */ + + blrl /* call "userf" */ + +/* call qt_cleanup(void *pt, void *vuserf_return) */ + lwz %r11,0(%r1) /* reload backchain (r11 is volatile) */ + + mr %r4,%r3 /* push "userf" return as 2nd parameter */ + lwz %r3,P_T_SAVE(%r11) /* reload "pt" */ + lwz %r5,P_CLEANUP_SAVE(%r11) /* reload "cleanup" */ + mtlr %r5 + blrl + b qt_error +/* dead code (some inline asm "wants" the epilog, or they genetare it) */ + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + diff --git a/ext/systemc/src/sysc/qt/md/powerpc_sys5_b.s b/ext/systemc/src/sysc/qt/md/powerpc_sys5_b.s new file mode 100644 index 000000000..e57a20e2e --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/powerpc_sys5_b.s @@ -0,0 +1,290 @@ +/* speed test for basic CPU operations */ + + +/* Marco Bucci <marco.bucci@inwind.it> */ + +/* This code was developed with the Code Warrior integrate ppc assembler. + * Macros are use to hide illegal constructs whether you are using a + * "normal" assembler or the "C integrated" assembler. + */ + +#if 0 + + + .text + .align 4 + + .globl b_call_reg + .globl _b_call_reg + .globl b_call_imm + .globl _b_call_imm + .globl b_add + .globl _b_add + .globl b_load + .globl _b_load + +.set fsize, 64 +.set lrsave, 4 + +#else + +#define fsize 64 +#define lrsave 4 + +#endif + + + + +#if 0 +.if 0 +#endif +asm void b_null(void) +{ +#if 0 +.endif +#endif + +#if 0 +b_null: +#endif + + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + +/* actually the same as the following. How to get "b_null" address? + * I didnt find the right sintax or the right way. + * I should take the current PC, then the difference to "b_null" + * (making the difference beween the labels), perform the sum and go?! + */ +#if 0 +.if 0 +#endif +asm void b_call_reg(long n) +{ +#if 0 +.endif +#endif + +#if 0 +b_call_reg: +_b_call_reg: +#endif + + mflr %r0 + stw %r31,-4(%r1) + stw %r30,-8(%r1) + stw %r0,lrsave(%r1) + stwu %r1,-fsize(%r1) + mr %r30,%r3 + li %r31,0 + + b L1 +L0: + bl b_null + bl b_null + bl b_null + bl b_null + bl b_null + + addi %r31,%r31,5 +L1: + cmpw %r31,%r30 + blt L0 + + + lwz %r0,lrsave+fsize(%r1) + mtlr %r0 + lwz %r31,-4+fsize(%r1) + lwz %r30,-8+fsize(%r1) + addi %r1,%r1,fsize + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + + +#if 0 +.if 0 +#endif +asm void b_call_imm(long n) +{ +#if 0 +.endif +#endif + +#if 0 +b_call_imm: +_b_call_imm: +#endif + + mflr %r0 + stw %r31,-4(%r1) + stw %r30,-8(%r1) + stw %r0,lrsave(%r1) + stwu %r1,-fsize(%r1) + mr %r30,%r3 + li %r31,0 + + b L3 +L2: + bl b_null + bl b_null + bl b_null + bl b_null + bl b_null + + addi %r31,%r31,5 +L3: + cmpw %r31,%r30 + blt L2 + + + lwz %r0,lrsave+fsize(%r1) + mtlr %r0 + lwz %r31,-4+fsize(%r1) + lwz %r30,-8+fsize(%r1) + addi %r1,%r1,fsize + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +#if 0 +.if 0 +#endif +asm void b_add(long n) +{ +#if 0 +.endif +#endif + +#if 0 +b_add: +_b_add: +#endif + + mflr %r0 + stw %r31,-4(%r1) + stw %r30,-8(%r1) + stw %r0,lrsave(%r1) + stwu %r1,-fsize(%r1) + mr %r30,%r3 + li %r31,0 + + b L5 +L4: + addi %r3,%r3,5 + addi %r4,%r4,5 + addi %r5,%r5,5 + addi %r6,%r6,5 + addi %r7,%r7,5 + + addi %r3,%r3,5 + addi %r4,%r4,5 + addi %r5,%r5,5 + addi %r6,%r6,5 + addi %r7,%r7,5 + + addi %r31,%r31,10 +L5: + cmpw %r31,%r30 + blt L4 + + + lwz %r0,lrsave+fsize(%r1) + mtlr %r0 + lwz %r31,-4+fsize(%r1) + lwz %r30,-8+fsize(%r1) + addi %r1,%r1,fsize + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif + + + +#if 0 +.if 0 +#endif +asm void b_load(long n) +{ +#if 0 +.endif +#endif + +#if 0 +b_load: +_b_load: +#endif + + mflr %r0 + stw %r31,-4(%r1) + stw %r30,-8(%r1) + stw %r0,lrsave(%r1) + stwu %r1,-fsize(%r1) + mr %r30,%r3 + li %r31,0 + + b L7 +L6: + lwz %r3,4(%r1) + lwz %r4,8(%r1) + lwz %r5,12(%r1) + lwz %r6,16(%r1) + lwz %r7,20(%r1) + + lwz %r3,24(%r1) + lwz %r4,28(%r1) + lwz %r5,32(%r1) + lwz %r6,36(%r1) + lwz %r7,40(%r1) + + + addi %r31,%r31,10 +L7: + cmpw %r31,%r30 + blt L6 + + + lwz %r0,lrsave+fsize(%r1) + mtlr %r0 + lwz %r31,-4+fsize(%r1) + lwz %r30,-8+fsize(%r1) + addi %r1,%r1,fsize + blr + +#if 0 +.if 0 +#endif +} +#if 0 +.endif +#endif diff --git a/ext/systemc/src/sysc/qt/md/pthreads.Makefile b/ext/systemc/src/sysc/qt/md/pthreads.Makefile new file mode 100644 index 000000000..f722fbe19 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/pthreads.Makefile @@ -0,0 +1,108 @@ +# Generated automatically from Makefile.in by configure. +# Makefile.in generated automatically by automake 1.4 from Makefile.am + +# Copyright (C) 1994, 1995-8, 1999 Free Software Foundation, Inc. +# This Makefile.in is free software; the Free Software Foundation +# gives unlimited permission to copy and/or distribute it, +# with or without modifications, as long as this notice is preserved. + +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY, to the extent permitted by law; without +# even the implied warranty of MERCHANTABILITY or FITNESS FOR A +# PARTICULAR PURPOSE. + + +SHELL = /bin/sh + +all: + +mostlyclean-noinstLIBRARIES: + +clean-noinstLIBRARIES: + +distclean-noinstLIBRARIES: + +maintainer-clean-noinstLIBRARIES: + +mostlyclean-compile: + +clean-compile: + +distclean-compile: + +maintainer-clean-compile: + +tags: + +ID: + +TAGS: + +mostlyclean-tags: + +clean-tags: + +distclean-tags: + +maintainer-clean-tags: + +distdir: + +info-am: +info: +dvi-am: +dvi: dvi-am +check-am: all-am +check: check-am +installcheck-am: +installcheck: installcheck-am +install-exec-am: +install-exec: install-exec-am + +install-data-am: install-data-local +install-data: install-data-am + +install-am: all-am +install: install-am +uninstall-am: uninstall-local +uninstall: uninstall-am +all-am: +all-redirect: +install-strip: +installdirs: + + +mostlyclean-generic: + +clean-generic: + +distclean-generic: + +maintainer-clean-generic: +mostlyclean-am: + +mostlyclean: + +clean-am: + +clean: + +distclean-am: + +distclean: + +maintainer-clean-am: + +maintainer-clean: + +.PHONY: + + +configuration: + +clean: + +install-data-local: + +uninstall-local: + diff --git a/ext/systemc/src/sysc/qt/md/solaris.README b/ext/systemc/src/sysc/qt/md/solaris.README new file mode 100644 index 000000000..04f855c44 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/solaris.README @@ -0,0 +1,19 @@ +Solaris 2.x is like System V (maybe it *is* System V?) and is different +from older versions in that it uses no leading underscore for variable +and function names. That is, the old convention was: + + foo(){} + +got compiled as + + .globl _foo + _foo: + +and is now compiled as + + .globl foo + foo: + +The `config' script should fix up the older (leading underscore) versions +of the machine-dependent files to use the newer (no leading underscore) +calling conventions. diff --git a/ext/systemc/src/sysc/qt/md/sparc.h b/ext/systemc/src/sysc/qt/md/sparc.h new file mode 100644 index 000000000..edaf5325e --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/sparc.h @@ -0,0 +1,140 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#ifndef QUICKTHREADS_SPARC_H +#define QUICKTHREADS_SPARC_H + +typedef unsigned long qt_word_t; + +/* Stack layout on the sparc: + + non-varargs: + + +--- + | <blank space for alignment> + | %o7 == return address -> qt_start + | %i7 + | %i6 == frame pointer -> 0 (NULL-terminated stack frame chain) + | %i5 -> only + | %i4 -> userf + | %i3 + | %i2 -> pt + | %i1 -> pu + | %i0 + | %l7 + | %l6 + | %l5 + | %l4 + | %l3 + | %l2 + | %l1 + | %l0 <--- qt_t.sp + +--- + + varargs: + + | : + | : + | argument list + | one-word aggregate return pointer + +--- + | <blank space for alignment> + | %o7 == return address -> qt_vstart + | %i7 + | %i6 == frame pointer -> 0 (NULL-terminated stack frame chain) + | %i5 -> startup + | %i4 -> userf + | %i3 -> cleanup + | %i2 -> pt + | %i1 + | %i0 + | %l7 + | %l6 + | %l5 + | %l4 + | %l3 + | %l2 + | %l1 + | %l0 <--- qt_t.sp + +--- + + */ + + +/* What to do to start a thread running. */ +extern void qt_start (void); +extern void qt_vstart (void); + + +/* Hold 17 saved registers + 1 word for alignment. */ +#define QUICKTHREADS_STKBASE (18 * 4) +#define QUICKTHREADS_VSTKBASE QUICKTHREADS_STKBASE + + +/* Stack must be doubleword aligned. */ +#define QUICKTHREADS_STKALIGN (8) /* Doubleword aligned. */ + +#define QUICKTHREADS_ONLY_INDEX (QUICKTHREADS_I5) +#define QUICKTHREADS_USER_INDEX (QUICKTHREADS_I4) +#define QUICKTHREADS_ARGT_INDEX (QUICKTHREADS_I2) +#define QUICKTHREADS_ARGU_INDEX (QUICKTHREADS_I1) + +#define QUICKTHREADS_VSTARTUP_INDEX (QUICKTHREADS_I5) +#define QUICKTHREADS_VUSERF_INDEX (QUICKTHREADS_I4) +#define QUICKTHREADS_VCLEANUP_INDEX (QUICKTHREADS_I3) +#define QUICKTHREADS_VARGT_INDEX (QUICKTHREADS_I2) + +#define QUICKTHREADS_O7 (16) +#define QUICKTHREADS_I6 (14) +#define QUICKTHREADS_I5 (13) +#define QUICKTHREADS_I4 (12) +#define QUICKTHREADS_I3 (11) +#define QUICKTHREADS_I2 (10) +#define QUICKTHREADS_I1 ( 9) + + +/* The thread will ``return'' to the `qt_start' routine to get things + going. The normal return sequence takes us to QUICKTHREADS_O7+8, so we + pre-subtract 8. The frame pointer chain is 0-terminated to prevent + the trap handler from chasing off in to random memory when flushing + stack windows. */ + +#define QUICKTHREADS_ARGS_MD(top) \ + (QUICKTHREADS_SPUT ((top), QUICKTHREADS_O7, ((void *)(((int)qt_start)-8))), \ + QUICKTHREADS_SPUT ((top), QUICKTHREADS_I6, 0)) + + +/* The varargs startup routine always reads 6 words of arguments + (6 argument registers) from the stack, offset by one word to + allow for an aggregate return area pointer. If the varargs + routine actually pushed fewer words than that, qt_vstart could read + off the top of the stack. To prevent errors, we always allocate 8 + words. The space is often just wasted. */ + +#define QUICKTHREADS_VARGS_MD0(sp, vabytes) \ + ((qt_t *)(((char *)(sp)) - 8*4 - QUICKTHREADS_STKROUNDUP(vabytes))) + +#define QUICKTHREADS_VARGS_MD1(sp) \ + (QUICKTHREADS_SPUT (sp, QUICKTHREADS_O7, ((void *)(((int)qt_vstart)-8)))) + +/* The SPARC has wierdo calling conventions which stores a hidden + parameter for returning aggregate values, so the rest of the + parameters are shoved up the stack by one place. */ +#define QUICKTHREADS_VARGS_ADJUST(sp) (((char *)sp)+4) + +#define QUICKTHREADS_VARGS_DEFAULT + + +#define QUICKTHREADS_GROW_DOWN + +#endif /* ndef QUICKTHREADS_SPARC_H */ diff --git a/ext/systemc/src/sysc/qt/md/sparc.s b/ext/systemc/src/sysc/qt/md/sparc.s new file mode 100644 index 000000000..d61236b54 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/sparc.s @@ -0,0 +1,142 @@ +/* sparc.s -- assembly support for the `qt' thread building kit. */ + +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +/* #include <machine/trap.h> */ + + .text + .align 4 + .global _qt_blocki + .global _qt_block + .global _qt_abort + .global _qt_start + .global _qt_vstart + +/* Register assignment: +// %o0: incoming `helper' function to call after cswap +// also used as outgoing sp of old thread (qt_t *) +// %o1, %o2: +// parameters to `helper' function called after cswap +// %o3: sp of new thread +// %o5: tmp used to save old thread sp, while using %o0 +// to call `helper' f() after cswap. +// +// +// Aborting a thread is easy if there are no cached register window +// frames: just switch to the new stack and away we go. If there are +// cached register window frames they must all be written back to the +// old stack before we move to the new stack. If we fail to do the +// writeback then the old stack memory can be written with register +// window contents e.g., after the stack memory has been freed and +// reused. +// +// If you don't believe this, try setting the frame pointer to zero +// once we're on the new stack. This will not affect correctnes +// otherwise because the frame pointer will eventually get reloaded w/ +// the new thread's frame pointer. But it will be zero briefly before +// the reload. You will eventually (100,000 cswaps later on a small +// SPARC machine that I tried) get an illegal instruction trap from +// the kernel trying to flush a cached window to location 0x0. +// +// Solution: flush windows before switching stacks, which invalidates +// all the other register windows. We could do the trap +// conditionally: if we're in the lowest frame of a thread, the fp is +// zero already so we know there's nothing cached. But we expect most +// aborts will be done from a first function that does a `save', so we +// will rarely save anything and always pay the cost of testing to see +// if we should flush. +// +// All floating-point registers are caller-save, so this routine +// doesn't need to do anything to save and restore them. +// +// `qt_block' and `qt_blocki' return the same value as the value +// returned by the helper function. We get this ``for free'' +// since we don't touch the return value register between the +// return from the helper function and return from qt_block{,i}. +*/ + +_qt_block: +_qt_blocki: + sub %sp, 8, %sp /* Allocate save area for return pc. */ + st %o7, [%sp+64] /* Save return pc. */ +_qt_abort: + ta 0x03 /* Save locals and ins. */ + mov %sp, %o5 /* Remember old sp w/o chng ins/locals. */ + sub %o3, 96, %sp /* Allocate kwsa, switch stacks. */ + call %o0, 0 /* Call `helper' routine. */ + mov %o5, %o0 /* Pass old thread to qt_after_t() */ + /* .. along w/ args in %o1 & %o2. */ + + /* Restore callee-save regs. The kwsa + // is on this stack, so offset all + // loads by sizeof(kwsa), 64 bytes. + */ + ldd [%sp+ 0+96], %l0 + ldd [%sp+ 8+96], %l2 + ldd [%sp+16+96], %l4 + ldd [%sp+24+96], %l6 + ldd [%sp+32+96], %i0 + ldd [%sp+40+96], %i2 + ldd [%sp+48+96], %i4 + ldd [%sp+56+96], %i6 + ld [%sp+64+96], %o7 /* Restore return pc. */ + + retl /* Return to address in %o7. */ + add %sp, 104, %sp /* Deallocate kwsa, ret pc area. */ + + +/* The function calling conventions say there has to be a 1-word area +// in the caller's stack to hold a pointer to space for aggregate +// return values. It also says there should be a 6-word area to hold +// %o0..%o5 if the callee wants to save them (why? I don't know...) +// Round up to 8 words to maintain alignment. +// +// Parameter values were stored in callee-save regs and are moved to +// the parameter registers. +*/ +_qt_start: + mov %i1, %o0 /* `pu': Set up args to `only'. */ + mov %i2, %o1 /* `pt'. */ + mov %i4, %o2 /* `userf'. */ + call %i5, 0 /* Call client function. */ + sub %sp, 32, %sp /* Allocate 6-word callee space. */ + + call _qt_error, 0 /* `only' erroniously returned. */ + nop + + +/* Same comments as `_qt_start' about allocating rounded-up 7-word +// save areas. */ + +_qt_vstart: + sub %sp, 32, %sp /* Allocate 7-word callee space. */ + call %i5, 0 /* call `startup'. */ + mov %i2, %o0 /* .. with argument `pt'. */ + + add %sp, 32, %sp /* Use 7-word space in varargs. */ + ld [%sp+ 4+64], %o0 /* Load arg0 ... */ + ld [%sp+ 8+64], %o1 + ld [%sp+12+64], %o2 + ld [%sp+16+64], %o3 + ld [%sp+20+64], %o4 + call %i4, 0 /* Call `userf'. */ + ld [%sp+24+64], %o5 + + /* Use 6-word space in varargs. */ + mov %o0, %o1 /* Pass return value from userf */ + call %i3, 0 /* .. when call `cleanup. */ + mov %i2, %o0 /* .. along with argument `pt'. */ + + call _qt_error, 0 /* `cleanup' erroniously returned. */ + nop diff --git a/ext/systemc/src/sysc/qt/md/sparc_b.s b/ext/systemc/src/sysc/qt/md/sparc_b.s new file mode 100644 index 000000000..cd26672d7 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/sparc_b.s @@ -0,0 +1,106 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + .globl _b_call_reg + .globl _b_call_imm + .globl _b_add + .globl _b_load + +_b_null: + retl + nop + +_b_call_reg: + sethi %hi(_b_null),%o4 + or %o4,%lo(_b_null),%o4 + add %o7,%g0, %o3 +L0: + call %o4 + nop + call %o4 + nop + call %o4 + nop + call %o4 + nop + call %o4 + nop + + subcc %o0,1,%o0 + bg L0 + nop + add %o3,%g0, %o7 + retl + nop + +_b_call_imm: + sethi %hi(_b_null),%o4 + or %o4,%lo(_b_null),%o4 + add %o7,%g0, %o3 +L1: + call _b_null + call _b_null + call _b_null + call _b_null + call _b_null + + subcc %o0,1,%o0 + bg L0 + nop + add %o3,%g0, %o7 + retl + nop + + +_b_add: + add %o0,%g0,%o1 + add %o0,%g0,%o2 + add %o0,%g0,%o3 + add %o0,%g0,%o4 +L2: + sub %o0,5,%o0 + sub %o1,5,%o1 + sub %o2,5,%o2 + sub %o3,5,%o3 + sub %o4,5,%o4 + + subcc %o0,5,%o0 + sub %o1,5,%o1 + sub %o2,5,%o2 + sub %o3,5,%o3 + sub %o4,5,%o4 + + bg L2 + nop + retl + nop + + +_b_load: + ld [%sp+ 0], %g0 +L3: + ld [%sp+ 4],%g0 + ld [%sp+ 8],%g0 + ld [%sp+12],%g0 + ld [%sp+16],%g0 + ld [%sp+20],%g0 + ld [%sp+24],%g0 + ld [%sp+28],%g0 + ld [%sp+32],%g0 + ld [%sp+36],%g0 + + subcc %o0,10,%o0 + bg L3 + ld [%sp+ 0],%g0 + retl + nop diff --git a/ext/systemc/src/sysc/qt/md/vax.h b/ext/systemc/src/sysc/qt/md/vax.h new file mode 100644 index 000000000..1948c6fbd --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/vax.h @@ -0,0 +1,130 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + +#ifndef QUICKTHREADS_VAX_H +#define QUICKTHREADS_VAX_H + +typedef unsigned long qt_word_t; + +/* Thread's initial stack layout on the VAX: + + non-varargs: + + +--- + | arg[2] === `userf' on startup + | arg[1] === `pt' on startup + | arg[0] === `pu' on startup + | ... === `only' on startup. + +--- + | ret pc === `qt_start' on startup + | fp === 0 on startup + | ap === 0 on startup + | <mask> + | 0 (handler) <--- qt_t.sp + +--- + + When a non-varargs thread is started, it ``returns'' to the start + routine, which calls the client's `only' function. + + The varargs case is clearly bad code. The various values should be + stored in a save area and snarfed in to callee-save registers on + startup. However, it's too painful to figure out the register + mask (right now), so do it the slow way. + + +--- + | arg[n-1] + | .. + | arg[0] + | nargs + +--- + | === `cleanup' + | === `vuserf' + | === `startup' + | === `pt' + +--- + | ret pc === `qt_start' on startup + | fp === 0 on startup + | ap === 0 on startup + | <mask> + | 0 (handler) <--- qt_t.sp + +--- + + When a varargs thread is started, it ``returns'' to the `qt_vstart' + startup code. The startup code pops all the extra arguments, then + calls the appropriate functions. */ + + +/* What to do to start a thread running. */ +extern void qt_start (void); +extern void qt_vstart (void); + + +/* Initial call frame for non-varargs and varargs cases. */ +#define QUICKTHREADS_STKBASE (10 * 4) +#define QUICKTHREADS_VSTKBASE (9 * 4) + + +/* Stack "must be" 4-byte aligned. (Actually, no, but it's + easiest and probably fastest to do so.) */ + +#define QUICKTHREADS_STKALIGN (4) + + +/* Where to place various arguments. */ +#define QUICKTHREADS_ONLY_INDEX (5) +#define QUICKTHREADS_USER_INDEX (8) +#define QUICKTHREADS_ARGT_INDEX (7) +#define QUICKTHREADS_ARGU_INDEX (6) + +#define QUICKTHREADS_VSTARTUP_INDEX (6) +#define QUICKTHREADS_VUSERF_INDEX (7) +#define QUICKTHREADS_VCLEANUP_INDEX (8) +#define QUICKTHREADS_VARGT_INDEX (5) + + +/* Stack grows down. The top of the stack is the first thing to + pop off (predecrement, postincrement). */ +#define QUICKTHREADS_GROW_DOWN + + +extern void qt_error (void); + +#define QUICKTHREADS_VAX_GMASK_NOREGS (0) + +/* Push on the error return address, null termination to call chains, + number of arguments to `only', register save mask (save no + registers). */ + +#define QUICKTHREADS_ARGS_MD(sto) \ + (QUICKTHREADS_SPUT (sto, 0, 0), \ + QUICKTHREADS_SPUT (sto, 1, QUICKTHREADS_VAX_GMASK_NOREGS), \ + QUICKTHREADS_SPUT (sto, 2, 0), \ + QUICKTHREADS_SPUT (sto, 3, 0), \ + QUICKTHREADS_SPUT (sto, 4, qt_start)) + +#define QUICKTHREADS_VARGS_MD0(sto, nbytes) \ + (QUICKTHREADS_SPUT (sto, (-(nbytes)/4)-1, (nbytes)/4), \ + ((char *)(((sto)-4) - QUICKTHREADS_STKROUNDUP(nbytes)))) + +#define QUICKTHREADS_VARGS_ADJUST(sp) ((char *)sp + 4) + +#define QUICKTHREADS_VARGS_MD1(sto) \ + (QUICKTHREADS_SPUT (sto, 0, 0), \ + QUICKTHREADS_SPUT (sto, 1, QUICKTHREADS_VAX_GMASK_NOREGS), \ + QUICKTHREADS_SPUT (sto, 2, 0), \ + QUICKTHREADS_SPUT (sto, 3, 0), \ + QUICKTHREADS_SPUT (sto, 4, qt_vstart)) + +#define QUICKTHREADS_VARGS_DEFAULT + +#endif /* QUICKTHREADS_VAX_H */ diff --git a/ext/systemc/src/sysc/qt/md/vax.s b/ext/systemc/src/sysc/qt/md/vax.s new file mode 100644 index 000000000..fed03f043 --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/vax.s @@ -0,0 +1,69 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + .text + + .globl _qt_abort + .globl _qt_block + .globl _qt_blocki + .globl _qt_start + .globl _qt_vstart + + +/* +// Calls to these routines have the signature +// +// void *block (func, arg1, arg2, newsp) +// +// Since the prologue saves 5 registers, nargs, pc, fp, ap, mask, and +// a condition handler (at sp+0), the first argument is 40=4*10 bytes +// offset from the stack pointer. +*/ +_qt_block: +_qt_blocki: +_qt_abort: + .word 0x7c0 /* Callee-save mask: 5 registers. */ + movl 56(sp),r1 /* Get stack pointer of new thread. */ + movl 52(sp),-(r1) /* Push arg2 */ + movl 48(sp),-(r1) /* Push arg1 */ + movl sp,-(r1) /* Push arg0 */ + + movl 44(sp),r0 /* Get helper to call. */ + movl r1,sp /* Move to new thread's stack. */ + addl3 sp,$12,fp /* .. including the frame pointer. */ + calls $3,(r0) /* Call helper. */ + + ret + +_qt_start: + movl (sp)+,r0 /* Get `only'. */ + calls $3,(r0) /* Call `only'. */ + calls $0,_qt_error /* `only' erroniously returned. */ + + +_qt_vstart: + movl (sp)+,r10 /* Get `pt'. */ + movl (sp)+,r9 /* Get `startup'. */ + movl (sp)+,r8 /* Get `vuserf'. */ + movl (sp)+,r7 /* Get `cleanup'. */ + + pushl r10 /* Push `qt'. */ + calls $1,(r9) /* Call `startup', pop `qt' on return. */ + + calls (sp)+,(r8) /* Call user's function. */ + + pushl r0 /* Push `vuserf_retval'. */ + pushl r10 /* Push `qt'. */ + calls $2,(r7) /* Call `cleanup', never return. */ + + calls $0,_qt_error /* `cleanup' erroniously returned. */ diff --git a/ext/systemc/src/sysc/qt/md/vax_b.s b/ext/systemc/src/sysc/qt/md/vax_b.s new file mode 100644 index 000000000..2db2d4fec --- /dev/null +++ b/ext/systemc/src/sysc/qt/md/vax_b.s @@ -0,0 +1,92 @@ +/* + * QuickThreads -- Threads-building toolkit. + * Copyright (c) 1993 by David Keppel + * + * Permission to use, copy, modify and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that the above copyright notice and this notice + * appear in all copies. This software is provided as a + * proof-of-concept and for demonstration purposes; there is no + * representation about the suitability of this software for any + * purpose. + */ + + .text + .globl _b_call_reg + .globl _b_call_imm + .globl _b_add + .globl _b_load + +_b_null: + .word 0x0 + ret + +_b_call_reg: + .word 0x0 + movl 4(ap),r0 + moval _b_null,r1 +L0: + calls $0,(r1) + calls $0,(r1) + calls $0,(r1) + calls $0,(r1) + calls $0,(r1) + + subl2 $5,r0 + bgtr L0 + ret + + +_b_call_imm: + .word 0x0 + movl 4(ap),r0 +L1: + calls $0,_b_null + calls $0,_b_null + calls $0,_b_null + calls $0,_b_null + calls $0,_b_null + + subl2 $5,r0 + bgtr L1 + ret + + +_b_add: + .word 0x0 + movl 4(ap),r0 +L2: + subl2 $1,r0 + subl2 $1,r0 + subl2 $1,r0 + subl2 $1,r0 + subl2 $1,r0 + + subl2 $1,r0 + subl2 $1,r0 + subl2 $1,r0 + subl2 $1,r0 + subl2 $1,r0 + + bgtr L2 + ret + + +_b_load: + .word 0x0 + movl 4(ap),r0 +L3: + movl 0(sp),r1 + movl 4(sp),r1 + movl 8(sp),r1 + movl 12(sp),r1 + movl 16(sp),r1 + movl 20(sp),r1 + movl 24(sp),r1 + movl 28(sp),r1 + movl 32(sp),r1 + movl 36(sp),r1 + + subl2 $1,r0 + bgtr L3 + ret |