source: Sophya/trunk/Poubelle/DPC:FitsIOServer/Blitz/blitz/tuning.h@ 680

Last change on this file since 680 was 658, checked in by ansari, 26 years ago

no message

File size: 3.9 KB
RevLine 
[658]1/***************************************************************************
2 * blitz/tuning.h Platform-specific code tuning
3 *
4 * $Id: tuning.h,v 1.1.1.1 1999-11-26 16:37:05 ansari Exp $
5 *
6 * Copyright (C) 1997,1998 Todd Veldhuizen <tveldhui@seurat.uwaterloo.ca>
7 *
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version 2
11 * of the License, or (at your option) any later version.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * Suggestions: blitz-suggest@cybervision.com
19 * Bugs: blitz-bugs@cybervision.com
20 *
21 * For more information, please see the Blitz++ Home Page:
22 * http://seurat.uwaterloo.ca/blitz/
23 *
24 ***************************************************************************
25 * $Log: not supported by cvs2svn $
26 * Revision 1.1.1.1 1999/04/09 17:58:59 ansari
27 * Creation module DPC/Blitz (blitz 0.4) Reza 09/04/99
28 *
29 * Revision 1.6 1998/03/14 00:04:47 tveldhui
30 * 0.2-alpha-05
31 *
32 * Revision 1.5 1997/07/16 14:51:20 tveldhui
33 * Update: Alpha release 0.2 (Arrays)
34 *
35 * Revision 1.4 1997/01/24 14:42:00 tveldhui
36 * Periodic RCS update
37 *
38 * Revision 1.3 1997/01/23 03:28:28 tveldhui
39 * Periodic RCS update
40 *
41 * Revision 1.2 1997/01/13 22:19:58 tveldhui
42 * Periodic RCS update
43 *
44 * Revision 1.1 1996/11/11 17:29:13 tveldhui
45 * Initial revision
46 *
47 *
48 */
49
50#ifndef BZ_TUNING_H
51#define BZ_TUNING_H
52
53// These estimates should be conservative (i.e. underestimate the
54// cache sizes).
55#define BZ_L1_CACHE_ESTIMATED_SIZE 8192
56#define BZ_L2_CACHE_ESTIMATED_SIZE 65536
57
58
59#undef BZ_PARTIAL_LOOP_UNROLL
60#define BZ_PASS_EXPR_BY_VALUE
61#undef BZ_PTR_INC_FASTER_THAN_INDIRECTION
62#define BZ_MANUAL_VECEXPR_COPY_CONSTRUCTOR
63#undef BZ_KCC_COPY_PROPAGATION_KLUDGE
64#undef BZ_ALTERNATE_FORWARD_BACKWARD_TRAVERSALS
65#undef BZ_ARRAY_EXPR_PASS_INDEX_BY_VALUE
66#define BZ_INLINE_GROUP1
67#define BZ_INLINE_GROUP2
68#define BZ_COLLAPSE_LOOPS
69#define BZ_USE_FAST_READ_ARRAY_EXPR
70#define BZ_ARRAY_EXPR_USE_COMMON_STRIDE
71#undef BZ_ARRAY_FAST_TRAVERSAL_UNROLL
72#undef BZ_ARRAY_STACK_TRAVERSAL_CSE_AND_ANTIALIAS
73#undef BZ_ARRAY_STACK_TRAVERSAL_UNROLL
74#define BZ_ARRAY_2D_STENCIL_TILING
75#define BZ_ARRAY_2D_STENCIL_TILE_SIZE 128
76#undef BZ_INTERLACE_ARRAYS
77
78
79/*
80 * Platform-specific tuning
81 */
82
83#ifdef _CRAYT3E
84 // The backend compiler on the T3E does a better job of
85 // loop unrolling.
86 #undef BZ_PARTIAL_LOOP_UNROLL
87 #undef BZ_ARRAY_FAST_TRAVERSAL_UNROLL
88 #undef BZ_ARRAY_STACK_TRAVERSAL_UNROLL
89#endif
90
91#ifdef __GNUC__
92 // The egcs compiler does a good job of loop unrolling, if
93 // -funroll-loops is used.
94 #undef BZ_PARTIAL_LOOP_UNROLL
95 #undef BZ_ARRAY_FAST_TRAVERSAL_UNROLL
96 #undef BZ_ARRAY_STACK_TRAVERSAL_UNROLL
97#endif
98
99#ifdef BZ_DISABLE_KCC_COPY_PROPAGATION_KLUDGE
100 #undef BZ_KCC_COPY_PROPAGATION_KLUDGE
101#endif
102
103#ifdef BZ_INLINE_GROUP1
104 #define _bz_inline1 inline
105#else
106 #define _bz_inline1
107#endif
108
109#ifdef BZ_INLINE_GROUP2
110 #define _bz_inline2 inline
111#else
112 #define _bz_inline2
113#endif
114
115#ifdef __DECCXX
116 // The DEC cxx compiler has problems with loop unrolling
117 // because of aliasing. Loop unrolling and anti-aliasing
118 // is done by Blitz++.
119
120 #define BZ_PARTIAL_LOOP_UNROLL
121 #define BZ_ARRAY_STACK_TRAVERSAL_CSE_AND_ANTIALIAS
122 #define BZ_ARRAY_STACK_TRAVERSAL_UNROLL
123#endif
124
125/*
126 * BZ_NO_PROPAGATE(X) prevents the compiler from performing
127 * copy propagation on a variable. This is used for loop
128 * unrolling to prevent KAI C++ from rearranging the
129 * ordering of memory accesses.
130 */
131
132#define BZ_NO_PROPAGATE(X) X
133
134#ifdef __KCC
135#ifdef BZ_USE_NO_PROPAGATE
136 extern "C" int __kai_apply(const char*, ...);
137
138 #undef BZ_NO_PROPAGATE(X)
139 #define BZ_NO_PROPAGATE(X) __kai_apply("(%a)",&X)
140#endif
141#endif
142
143#endif // BZ_TUNING_H
Note: See TracBrowser for help on using the repository browser.