ViewVC Help
View File | Revision Log | Show Annotations | Revision Graph | Root Listing
root/cebix/SheepShaver/src/Unix/sysdeps.h
Revision: 1.54
Committed: 2006-07-06T00:01:04Z (17 years, 10 months ago) by gbeauche
Content type: text/plain
Branch: MAIN
Changes since 1.53: +1 -1 lines
Log Message:
Add more micro asm optimisations to x86{,-64} (mulhw, mulhwu, slw, srw, cntlzw
and subf* series). Also now enable the optimisations on x86_64 by default.

File Contents

# User Rev Content
1 cebix 1.1 /*
2     * sysdeps.h - System dependent definitions for Linux
3     *
4 gbeauche 1.36 * SheepShaver (C) 1997-2005 Christian Bauer and Marc Hellwig
5 cebix 1.1 *
6     * This program is free software; you can redistribute it and/or modify
7     * it under the terms of the GNU General Public License as published by
8     * the Free Software Foundation; either version 2 of the License, or
9     * (at your option) any later version.
10     *
11     * This program is distributed in the hope that it will be useful,
12     * but WITHOUT ANY WARRANTY; without even the implied warranty of
13     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14     * GNU General Public License for more details.
15     *
16     * You should have received a copy of the GNU General Public License
17     * along with this program; if not, write to the Free Software
18     * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19     */
20    
21     #ifndef SYSDEPS_H
22     #define SYSDEPS_H
23    
24     #ifndef __STDC__
25     #error "Your compiler is not ANSI. Get a real one."
26     #endif
27    
28     #include "config.h"
29     #include "user_strings_unix.h"
30    
31     #ifndef STDC_HEADERS
32     #error "You don't have ANSI C header files."
33     #endif
34    
35     #ifdef HAVE_UNISTD_H
36     # include <sys/types.h>
37     # include <unistd.h>
38     #endif
39    
40     #include <netinet/in.h>
41     #include <assert.h>
42     #include <stdio.h>
43     #include <stdlib.h>
44 gbeauche 1.37 #include <stddef.h>
45 cebix 1.1 #include <string.h>
46     #include <signal.h>
47    
48 gbeauche 1.24 #ifdef HAVE_PTHREADS
49     # include <pthread.h>
50     #endif
51    
52 cebix 1.1 #ifdef HAVE_FCNTL_H
53     # include <fcntl.h>
54     #endif
55    
56     #ifdef TIME_WITH_SYS_TIME
57     # include <sys/time.h>
58     # include <time.h>
59     #else
60     # ifdef HAVE_SYS_TIME_H
61     # include <sys/time.h>
62     # else
63     # include <time.h>
64     # endif
65     #endif
66    
// Replacement offsetof() for C++ builds on FreeBSD (works around the
// system definition with GCC >= 3.4)
#if defined(__cplusplus) && defined(__FreeBSD__)
# undef offsetof
/* Going through "char &" sidesteps any user-defined "operator &",
   which a POD type is allowed to declare. */
# define offsetof(TYPE, MEMBER) \
	(__offsetof__ (reinterpret_cast <size_t> \
		(&reinterpret_cast <char &> (static_cast<TYPE *> (0)->MEMBER))))
#endif
77    
78 gbeauche 1.5 // Define for external components
79     #define SHEEPSHAVER 1
80    
// Select the memory addressing scheme. Each branch below defines exactly
// one of REAL_ADDRESSING or DIRECT_ADDRESSING.
81 gbeauche 1.34 // Always use Real Addressing mode on native architectures
82     // Otherwise, use Direct Addressing mode if NATMEM_OFFSET is set
83 gbeauche 1.35 #if !defined(EMULATED_PPC)
84 gbeauche 1.4 #define REAL_ADDRESSING 1
// Builds without EMULATED_PPC also include ppc_asm.tmpl here
85 gbeauche 1.39 #include "ppc_asm.tmpl"
86 gbeauche 1.35 #elif defined(NATMEM_OFFSET)
87     #define DIRECT_ADDRESSING 1
88 gbeauche 1.34 #else
89 gbeauche 1.35 #define REAL_ADDRESSING 1
90 gbeauche 1.34 #endif
91 gbeauche 1.4
92 gbeauche 1.48 // Always use the complete non-stubs Ethernet driver
93     #define USE_ETHER_FULL_DRIVER 1
94    
95 gbeauche 1.5 #define POWERPC_ROM 1
96    
// ROM protection and emulator settings; these differ depending on whether
// EMULATED_PPC is set.
97     #if EMULATED_PPC
98     // Mac ROM is write protected when banked memory is used
// With real or direct addressing the ROM is left writable and
// USE_SCRATCHMEM_SUBTERFUGE is enabled. In the other (banked) branch
// USE_SCRATCHMEM_SUBTERFUGE is not defined at all.
99     #if REAL_ADDRESSING || DIRECT_ADDRESSING
100     # define ROM_IS_WRITE_PROTECTED 0
101     # define USE_SCRATCHMEM_SUBTERFUGE 1
102 cebix 1.1 #else
103 gbeauche 1.5 # define ROM_IS_WRITE_PROTECTED 1
104     #endif
105 gbeauche 1.9 // Configure PowerPC emulator
106 gbeauche 1.29 #define PPC_REENTRANT_JIT 1
107 gbeauche 1.30 #define PPC_CHECK_INTERRUPTS 1
108 gbeauche 1.14 #define PPC_DECODE_CACHE 1
109 gbeauche 1.10 #define PPC_FLIGHT_RECORDER 1
110 gbeauche 1.17 #define PPC_PROFILE_COMPILE_TIME 0
111     #define PPC_PROFILE_GENERIC_CALLS 0
112 gbeauche 1.16 #define KPX_MAX_CPUS 1
// PPC_ENABLE_JIT is only defined when the build sets ENABLE_DYNGEN
113 gbeauche 1.33 #if ENABLE_DYNGEN
114     #define PPC_ENABLE_JIT 1
115     #endif
// DYNGEN_ASM_OPTS is defined on both 32-bit and 64-bit x86 hosts
// (presumably the x86 micro asm optimisations -- confirm against users)
116 gbeauche 1.54 #if defined(__i386__) || defined(__x86_64__)
117 gbeauche 1.28 #define DYNGEN_ASM_OPTS 1
118     #endif
119 gbeauche 1.5 #else
120     // Mac ROM is write protected
121     #define ROM_IS_WRITE_PROTECTED 1
122     #define USE_SCRATCHMEM_SUBTERFUGE 0
123 cebix 1.1 #endif
124    
125     // Data types
126     typedef unsigned char uint8;
127     typedef signed char int8;
128     #if SIZEOF_SHORT == 2
129     typedef unsigned short uint16;
130     typedef short int16;
131     #elif SIZEOF_INT == 2
132     typedef unsigned int uint16;
133     typedef int int16;
134     #else
135     #error "No 2 byte type, you lose."
136     #endif
137     #if SIZEOF_INT == 4
138     typedef unsigned int uint32;
139     typedef int int32;
140     #elif SIZEOF_LONG == 4
141     typedef unsigned long uint32;
142     typedef long int32;
143     #else
144     #error "No 4 byte type, you lose."
145     #endif
146     #if SIZEOF_LONG == 8
147     typedef unsigned long uint64;
148     typedef long int64;
149 gbeauche 1.3 #define VAL64(a) (a ## l)
150     #define UVAL64(a) (a ## ul)
151 cebix 1.1 #elif SIZEOF_LONG_LONG == 8
152     typedef unsigned long long uint64;
153     typedef long long int64;
154 gbeauche 1.3 #define VAL64(a) (a ## LL)
155     #define UVAL64(a) (a ## uLL)
156 cebix 1.1 #else
157     #error "No 8 byte type, you lose."
158     #endif
159 gbeauche 1.3 #if SIZEOF_VOID_P == 4
160     typedef uint32 uintptr;
161     typedef int32 intptr;
162     #elif SIZEOF_VOID_P == 8
163     typedef uint64 uintptr;
164     typedef int64 intptr;
165     #else
166     #error "Unsupported size of pointer"
167 gbeauche 1.5 #endif
168    
169 gbeauche 1.53 // Define if the host processor supports fast unaligned load/stores
170     #if defined __i386__ || defined __x86_64__
171     #define UNALIGNED_PROFITABLE 1
172     #endif
173    
174    
175 gbeauche 1.15 /**
176     * Helper functions to byteswap data
177     **/
178    
179     #if defined(__GNUC__)
180 gbeauche 1.23 #if defined(__x86_64__) || defined(__i386__)
181 gbeauche 1.15 // Linux/AMD64 currently has no asm optimized bswap_32() in <byteswap.h>
182     #define opt_bswap_32 do_opt_bswap_32
183     static inline uint32 do_opt_bswap_32(uint32 x)
184     {
185     uint32 v;
186     __asm__ __volatile__ ("bswap %0" : "=r" (v) : "0" (x));
187     return v;
188     }
189     #endif
190     #endif
191    
192 gbeauche 1.5 #ifdef HAVE_BYTESWAP_H
193     #include <byteswap.h>
194     #endif
195    
196 gbeauche 1.15 #ifdef opt_bswap_16
197     #undef bswap_16
198     #define bswap_16 opt_bswap_16
199     #endif
200 gbeauche 1.5 #ifndef bswap_16
201     #define bswap_16 generic_bswap_16
202     #endif
203    
204     static inline uint16 generic_bswap_16(uint16 x)
205     {
206     return ((x & 0xff) << 8) | ((x >> 8) & 0xff);
207     }
208    
209 gbeauche 1.15 #ifdef opt_bswap_32
210     #undef bswap_32
211     #define bswap_32 opt_bswap_32
212     #endif
213 gbeauche 1.5 #ifndef bswap_32
214     #define bswap_32 generic_bswap_32
215     #endif
216    
217     static inline uint32 generic_bswap_32(uint32 x)
218     {
219     return (((x & 0xff000000) >> 24) |
220     ((x & 0x00ff0000) >> 8) |
221     ((x & 0x0000ff00) << 8) |
222     ((x & 0x000000ff) << 24) );
223     }
224 gbeauche 1.23
#if defined(__i386__)
#define opt_bswap_64 do_opt_bswap_64
// 64-bit byte swap built from two 32-bit swaps: each half is byte-reversed
// and the two halves trade places.
static inline uint64 do_opt_bswap_64(uint64 x)
{
	const uint32 upper = x >> 32;
	const uint32 lower = (uint32)x;
	const uint64 new_upper = ((uint64)bswap_32(lower)) << 32;
	return bswap_32(upper) | new_upper;
}
#endif
232 gbeauche 1.5
233 gbeauche 1.15 #ifdef opt_bswap_64
234     #undef bswap_64
235     #define bswap_64 opt_bswap_64
236     #endif
237 gbeauche 1.5 #ifndef bswap_64
238     #define bswap_64 generic_bswap_64
239     #endif
240    
241     static inline uint64 generic_bswap_64(uint64 x)
242     {
243     return (((x & UVAL64(0xff00000000000000)) >> 56) |
244     ((x & UVAL64(0x00ff000000000000)) >> 40) |
245     ((x & UVAL64(0x0000ff0000000000)) >> 24) |
246     ((x & UVAL64(0x000000ff00000000)) >> 8) |
247     ((x & UVAL64(0x00000000ff000000)) << 8) |
248     ((x & UVAL64(0x0000000000ff0000)) << 24) |
249     ((x & UVAL64(0x000000000000ff00)) << 40) |
250     ((x & UVAL64(0x00000000000000ff)) << 56) );
251     }
252    
253     #ifdef WORDS_BIGENDIAN
254     static inline uint16 tswap16(uint16 x) { return x; }
255     static inline uint32 tswap32(uint32 x) { return x; }
256     static inline uint64 tswap64(uint64 x) { return x; }
257     #else
258     static inline uint16 tswap16(uint16 x) { return bswap_16(x); }
259     static inline uint32 tswap32(uint32 x) { return bswap_32(x); }
260     static inline uint64 tswap64(uint64 x) { return bswap_64(x); }
261 gbeauche 1.3 #endif
262 cebix 1.1
263 gbeauche 1.6 // spin locks
264     #ifdef __GNUC__
265    
266 gbeauche 1.22 #if defined(__powerpc__) || defined(__ppc__)
267 gbeauche 1.6 #define HAVE_TEST_AND_SET 1
/*
 * Atomic test-and-set for PowerPC hosts.
 *
 * Loads *p with a reservation (lwarx). If the value is non-zero it is
 * returned and nothing is stored. If it is zero, 1 is stored with stwcx.,
 * retrying from the load whenever the conditional store fails.
 *
 * Returns the value found in *p: 0 means this call changed it to 1.
 */
268 gbeauche 1.20 static inline int testandset(volatile int *p)
269 gbeauche 1.6 {
270     int ret;
/* "xor." against operand %3 (zero) leaves the loaded value unchanged but
   sets cr0, which the following "bne 1f" tests */
271 gbeauche 1.22 __asm__ __volatile__("0: lwarx %0,0,%1\n"
272     " xor. %0,%3,%0\n"
273     " bne 1f\n"
274     " stwcx. %2,0,%1\n"
275     " bne- 0b\n"
276 gbeauche 1.6 "1: "
277     : "=&r" (ret)
278     : "r" (p), "r" (1), "r" (0)
279     : "cr0", "memory");
280     return ret;
281     }
282     #endif
283    
#if defined(__x86_64__) || defined(__i386__)
#define HAVE_TEST_AND_SET 1
/*
 * Atomic test-and-set for x86 hosts: stores 1 into *p and returns the
 * value *p held before the exchange (0 means this call changed it to 1).
 */
static inline int testandset(volatile int *p)
{
	int previous;
	/* "xchg" with a memory operand needs no "lock" prefix */
	__asm__ __volatile__("xchgl %0, %1"
	                     : "=r" (previous), "+m" (*p)
	                     : "0" (1)
	                     : "memory");
	return previous;
}
#endif
297    
298     #ifdef __s390__
299     #define HAVE_TEST_AND_SET 1
/*
 * Atomic test-and-set for s390 hosts, built on compare-and-swap ("cs").
 *
 * ret starts out as the current value of *p. "cs" stores 1 if *p still
 * equals ret; otherwise it reloads ret from memory and "jl" loops back to
 * try again.
 *
 * Returns the value *p held when the swap succeeded.
 */
300 gbeauche 1.20 static inline int testandset(volatile int *p)
301 gbeauche 1.6 {
302     int ret;
303    
304     __asm__ __volatile__("0: cs %0,%1,0(%2)\n"
305     " jl 0b"
306     : "=&d" (ret)
307     : "r" (1), "a" (p), "0" (*p)
308     : "cc", "memory" );
309     return ret;
310     }
311     #endif
312    
#ifdef __alpha__
#define HAVE_TEST_AND_SET 1
/*
 * Atomic test-and-set for Alpha hosts.
 *
 * Loads *p with ldl_l and stores 1 with stl_c; if the conditional store
 * fails, the out-of-line branch in subsection 2 restarts the sequence.
 *
 * Returns the value *p held before the store (0 means this call changed
 * it to 1).
 *
 * The "memory" clobber stops the compiler from moving other memory
 * accesses across the acquisition, as the other architecture variants of
 * this function already do.
 */
static inline int testandset(volatile int *p)
{
	int ret;
	unsigned long one;

	__asm__ __volatile__("0: mov 1,%2\n"
	                     " ldl_l %0,%1\n"
	                     " stl_c %2,%1\n"
	                     " beq %2,1f\n"
	                     ".subsection 2\n"
	                     "1: br 0b\n"
	                     ".previous"
	                     : "=r" (ret), "=m" (*p), "=r" (one)
	                     : "m" (*p)
	                     : "memory");
	return ret;
}
#endif
332    
333     #ifdef __sparc__
334     #define HAVE_TEST_AND_SET 1
/*
 * Atomic test-and-set for SPARC hosts, using "ldstub".
 *
 * ldstub fetches the single byte at address p and sets that byte to all
 * ones in one atomic step. Only that byte is touched, not the whole int.
 *
 * Returns 1 if the byte was already non-zero, 0 otherwise.
 */
335 gbeauche 1.20 static inline int testandset(volatile int *p)
336 gbeauche 1.6 {
337     int ret;
338    
339     __asm__ __volatile__("ldstub [%1], %0"
340     : "=r" (ret)
341     : "r" (p)
342     : "memory");
343    
/* Collapse the fetched byte to a strict 0/1 result */
344     return (ret ? 1 : 0);
345     }
346     #endif
347    
#ifdef __arm__
#define HAVE_TEST_AND_SET 1
/*
 * Atomic test-and-set for ARM hosts: "swp" exchanges the register holding
 * 1 with the word at p.
 *
 * Returns the value *p held before the swap (0 means this call changed it
 * to 1).
 *
 * The "memory" clobber stops the compiler from moving other memory
 * accesses across the acquisition, as the other architecture variants of
 * this function already do.
 */
static inline int testandset(volatile int *p)
{
	unsigned int ret;
	__asm__ __volatile__("swp %0, %1, [%2]"
	                     : "=r"(ret)
	                     : "0"(1), "r"(p)
	                     : "memory");

	return ret;
}
#endif
360    
361     #endif /* __GNUC__ */
362    
// Spin lock word: 0 means free, non-zero means held
typedef volatile int spinlock_t;

// Initial (unlocked) value for a spinlock_t
static const spinlock_t SPIN_LOCK_UNLOCKED = 0;

#if defined(HAVE_TEST_AND_SET) && defined(HAVE_PTHREADS)
// There is nothing to lock if we are not in a multithreaded environment
#define HAVE_SPINLOCKS 1

// Busy-wait until testandset() reports that the lock was free
static inline void spin_lock(spinlock_t *lock)
{
	while (testandset(lock))
		;
}

// Release the lock by writing 0 into it
static inline void spin_unlock(spinlock_t *lock)
{
	/* Compiler barrier: keeps accesses made inside the critical section
	   from being moved below the releasing store. HAVE_TEST_AND_SET is
	   only defined for GCC-compatible compilers, so GNU asm is available
	   in this branch. */
	__asm__ __volatile__("" : : : "memory");
	*lock = 0;
}

// Single acquisition attempt; returns non-zero if the lock was obtained
static inline int spin_trylock(spinlock_t *lock)
{
	return !testandset(lock);
}
#else
// No-op versions: locking always "succeeds" and nothing is written
static inline void spin_lock(spinlock_t *lock)
{
	(void)lock;
}

static inline void spin_unlock(spinlock_t *lock)
{
	(void)lock;
}

static inline int spin_trylock(spinlock_t *lock)
{
	(void)lock;
	return 1;
}
#endif
398    
399 cebix 1.1 // Time data type for Time Manager emulation
400     #ifdef HAVE_CLOCK_GETTIME
401     typedef struct timespec tm_time_t;
402     #else
403     typedef struct timeval tm_time_t;
404     #endif
405    
406 gbeauche 1.42 /* Define codes for all the float formats that we know of.
407     * Though we only handle IEEE format. */
408     #define UNKNOWN_FLOAT_FORMAT 0
409     #define IEEE_FLOAT_FORMAT 1
410     #define VAX_FLOAT_FORMAT 2
411     #define IBM_FLOAT_FORMAT 3
412     #define C4X_FLOAT_FORMAT 4
413    
414 gbeauche 1.40 // High-precision timing
415 gbeauche 1.46 #if defined(HAVE_PTHREADS) && defined(HAVE_CLOCK_NANOSLEEP)
416 gbeauche 1.40 #define PRECISE_TIMING 1
417     #define PRECISE_TIMING_POSIX 1
418     #endif
419    
420 gbeauche 1.18 // Timing functions
421     extern uint64 GetTicks_usec(void);
422     extern void Delay_usec(uint32 usec);
423    
424 gbeauche 1.43 #ifdef HAVE_PTHREADS
425 cebix 1.2 // Setup pthread attributes
426     extern void Set_pthread_attr(pthread_attr_t *attr, int priority);
427 gbeauche 1.24 #endif
428 cebix 1.2
429 cebix 1.1 // Various definitions
430     typedef struct rgb_color {
431     uint8 red;
432     uint8 green;
433     uint8 blue;
434     uint8 alpha;
435     } rgb_color;
436    
// X11 display fast locks
//
// XDisplayLock() / XDisplayUnlock() guard x_display_lock with a pthread
// mutex when HAVE_PTHREADS is defined, with a spin lock when only
// HAVE_SPINLOCKS is defined, and expand to nothing otherwise. None of the
// macros ends in a semicolon: callers write "XDisplayLock();", which then
// forms exactly one statement and stays safe inside an unbraced if/else.
#if defined(HAVE_PTHREADS)
#define X11_LOCK_TYPE pthread_mutex_t
#define X11_LOCK_INIT PTHREAD_MUTEX_INITIALIZER
#define XDisplayLock() pthread_mutex_lock(&x_display_lock)
#define XDisplayUnlock() pthread_mutex_unlock(&x_display_lock)
#elif defined(HAVE_SPINLOCKS)
#define X11_LOCK_TYPE spinlock_t
#define X11_LOCK_INIT SPIN_LOCK_UNLOCKED
#define XDisplayLock() spin_lock(&x_display_lock)
#define XDisplayUnlock() spin_unlock(&x_display_lock)
#else
#define XDisplayLock()
#define XDisplayUnlock()
#endif
// The lock object itself is defined elsewhere, and only when a lock type
// was selected above
#ifdef X11_LOCK_TYPE
extern X11_LOCK_TYPE x_display_lock;
#endif
455    
456 cebix 1.1 // Macro for calling MacOS routines
457 gbeauche 1.34 #define CallMacOS(type, tvect) call_macos((uintptr)tvect)
458     #define CallMacOS1(type, tvect, arg1) call_macos1((uintptr)tvect, (uintptr)arg1)
459     #define CallMacOS2(type, tvect, arg1, arg2) call_macos2((uintptr)tvect, (uintptr)arg1, (uintptr)arg2)
460     #define CallMacOS3(type, tvect, arg1, arg2, arg3) call_macos3((uintptr)tvect, (uintptr)arg1, (uintptr)arg2, (uintptr)arg3)
461     #define CallMacOS4(type, tvect, arg1, arg2, arg3, arg4) call_macos4((uintptr)tvect, (uintptr)arg1, (uintptr)arg2, (uintptr)arg3, (uintptr)arg4)
462     #define CallMacOS5(type, tvect, arg1, arg2, arg3, arg4, arg5) call_macos5((uintptr)tvect, (uintptr)arg1, (uintptr)arg2, (uintptr)arg3, (uintptr)arg4, (uintptr)arg5)
463     #define CallMacOS6(type, tvect, arg1, arg2, arg3, arg4, arg5, arg6) call_macos6((uintptr)tvect, (uintptr)arg1, (uintptr)arg2, (uintptr)arg3, (uintptr)arg4, (uintptr)arg5, (uintptr)arg6)
464     #define CallMacOS7(type, tvect, arg1, arg2, arg3, arg4, arg5, arg6, arg7) call_macos7((uintptr)tvect, (uintptr)arg1, (uintptr)arg2, (uintptr)arg3, (uintptr)arg4, (uintptr)arg5, (uintptr)arg6, (uintptr)arg7)
465 cebix 1.1
466 gbeauche 1.3 #ifdef __cplusplus
467     extern "C" {
468     #endif
469     extern uint32 call_macos(uint32 tvect);
470     extern uint32 call_macos1(uint32 tvect, uint32 arg1);
471     extern uint32 call_macos2(uint32 tvect, uint32 arg1, uint32 arg2);
472     extern uint32 call_macos3(uint32 tvect, uint32 arg1, uint32 arg2, uint32 arg3);
473     extern uint32 call_macos4(uint32 tvect, uint32 arg1, uint32 arg2, uint32 arg3, uint32 arg4);
474     extern uint32 call_macos5(uint32 tvect, uint32 arg1, uint32 arg2, uint32 arg3, uint32 arg4, uint32 arg5);
475     extern uint32 call_macos6(uint32 tvect, uint32 arg1, uint32 arg2, uint32 arg3, uint32 arg4, uint32 arg5, uint32 arg6);
476     extern uint32 call_macos7(uint32 tvect, uint32 arg1, uint32 arg2, uint32 arg3, uint32 arg4, uint32 arg5, uint32 arg6, uint32 arg7);
477     #ifdef __cplusplus
478     }
479     #endif
480 cebix 1.1
481     #endif