| [658] | 1 | /***************************************************************************
 | 
|---|
 | 2 |  * blitz/tuning.h      Platform-specific code tuning
 | 
|---|
 | 3 |  *
 | 
|---|
 | 4 |  * $Id: tuning.h,v 1.1.1.1 1999-11-26 16:37:05 ansari Exp $
 | 
|---|
 | 5 |  *
 | 
|---|
 | 6 |  * Copyright (C) 1997,1998 Todd Veldhuizen <tveldhui@seurat.uwaterloo.ca>
 | 
|---|
 | 7 |  *
 | 
|---|
 | 8 |  * This program is free software; you can redistribute it and/or
 | 
|---|
 | 9 |  * modify it under the terms of the GNU General Public License
 | 
|---|
 | 10 |  * as published by the Free Software Foundation; either version 2
 | 
|---|
 | 11 |  * of the License, or (at your option) any later version.
 | 
|---|
 | 12 |  *
 | 
|---|
 | 13 |  * This program is distributed in the hope that it will be useful,
 | 
|---|
 | 14 |  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
|---|
 | 15 |  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
|---|
 | 16 |  * GNU General Public License for more details.
 | 
|---|
 | 17 |  *
 | 
|---|
 | 18 |  * Suggestions:          blitz-suggest@cybervision.com
 | 
|---|
 | 19 |  * Bugs:                 blitz-bugs@cybervision.com
 | 
|---|
 | 20 |  *
 | 
|---|
 | 21 |  * For more information, please see the Blitz++ Home Page:
 | 
|---|
 | 22 |  *    http://seurat.uwaterloo.ca/blitz/
 | 
|---|
 | 23 |  *
 | 
|---|
 | 24 |  ***************************************************************************
 | 
|---|
 | 25 |  * $Log: not supported by cvs2svn $
 | 
|---|
 | 26 |  * Revision 1.1.1.1  1999/04/09  17:58:59  ansari
 | 
|---|
 | 27 |  * Creation module DPC/Blitz (blitz 0.4) Reza 09/04/99
 | 
|---|
 | 28 |  *
 | 
|---|
 | 29 |  * Revision 1.6  1998/03/14 00:04:47  tveldhui
 | 
|---|
 | 30 |  * 0.2-alpha-05
 | 
|---|
 | 31 |  *
 | 
|---|
 | 32 |  * Revision 1.5  1997/07/16 14:51:20  tveldhui
 | 
|---|
 | 33 |  * Update: Alpha release 0.2 (Arrays)
 | 
|---|
 | 34 |  *
 | 
|---|
 | 35 |  * Revision 1.4  1997/01/24 14:42:00  tveldhui
 | 
|---|
 | 36 |  * Periodic RCS update
 | 
|---|
 | 37 |  *
 | 
|---|
 | 38 |  * Revision 1.3  1997/01/23 03:28:28  tveldhui
 | 
|---|
 | 39 |  * Periodic RCS update
 | 
|---|
 | 40 |  *
 | 
|---|
 | 41 |  * Revision 1.2  1997/01/13 22:19:58  tveldhui
 | 
|---|
 | 42 |  * Periodic RCS update
 | 
|---|
 | 43 |  *
 | 
|---|
 | 44 |  * Revision 1.1  1996/11/11 17:29:13  tveldhui
 | 
|---|
 | 45 |  * Initial revision
 | 
|---|
 | 46 |  *
 | 
|---|
 | 47 |  *
 | 
|---|
 | 48 |  */
 | 
|---|
 | 49 | 
 | 
|---|
 | 50 | #ifndef BZ_TUNING_H
 | 
|---|
 | 51 | #define BZ_TUNING_H
 | 
|---|
 | 52 | 
 | 
|---|
 /*
  * Estimated cache sizes.  Keep these conservative: an estimate that
  * undershoots the real cache size is preferred over one that overshoots.
  * NOTE(review): units are presumably bytes -- not stated here, confirm.
  */
 #define BZ_L2_CACHE_ESTIMATED_SIZE    65536
 #define BZ_L1_CACHE_ESTIMATED_SIZE    8192
 | 
|---|
 | 57 | 
 | 
|---|
 | 58 | 
 | 
|---|
 /*
  * Default tuning switches.
  *
  * Each switch is either defined (with an empty body, except for the
  * stencil tile size) or explicitly undefined.  The explicit #undef also
  * discards any definition that was supplied before this header was read.
  * Sections further down in this header may override these defaults for
  * specific compilers.
  */

 /* Switches that are defined by default. */
 #define BZ_PASS_EXPR_BY_VALUE
 #define BZ_MANUAL_VECEXPR_COPY_CONSTRUCTOR
 #define BZ_INLINE_GROUP1
 #define BZ_INLINE_GROUP2
 #define BZ_COLLAPSE_LOOPS
 #define BZ_USE_FAST_READ_ARRAY_EXPR
 #define BZ_ARRAY_EXPR_USE_COMMON_STRIDE
 #define BZ_ARRAY_2D_STENCIL_TILING
 #define BZ_ARRAY_2D_STENCIL_TILE_SIZE       128

 /* Switches that are left undefined by default. */
 #undef  BZ_PARTIAL_LOOP_UNROLL
 #undef  BZ_PTR_INC_FASTER_THAN_INDIRECTION
 #undef  BZ_KCC_COPY_PROPAGATION_KLUDGE
 #undef  BZ_ALTERNATE_FORWARD_BACKWARD_TRAVERSALS
 #undef  BZ_ARRAY_EXPR_PASS_INDEX_BY_VALUE
 #undef  BZ_ARRAY_FAST_TRAVERSAL_UNROLL
 #undef  BZ_ARRAY_STACK_TRAVERSAL_CSE_AND_ANTIALIAS
 #undef  BZ_ARRAY_STACK_TRAVERSAL_UNROLL
 #undef  BZ_INTERLACE_ARRAYS
 | 
|---|
 | 77 | 
 | 
|---|
 | 78 | 
 | 
|---|
 /*
  * Platform-specific tuning
  *
  * On the compilers below, the three Blitz++ unrolling switches are
  * undefined so that loop unrolling is left to the compiler:
  *
  *   _CRAYT3E  - the backend compiler on the T3E does a better job of
  *               loop unrolling.
  *   __GNUC__  - the egcs compiler does a good job of loop unrolling,
  *               provided -funroll-loops is used.
  */

 #if defined(_CRAYT3E) || defined(__GNUC__)
  #undef BZ_ARRAY_STACK_TRAVERSAL_UNROLL
  #undef BZ_ARRAY_FAST_TRAVERSAL_UNROLL
  #undef BZ_PARTIAL_LOOP_UNROLL
 #endif
 | 
|---|
 | 98 | 
 | 
|---|
 /*
  * Opt-out hook: when BZ_DISABLE_KCC_COPY_PROPAGATION_KLUDGE is defined,
  * make sure BZ_KCC_COPY_PROPAGATION_KLUDGE is not.
  */
 #if defined(BZ_DISABLE_KCC_COPY_PROPAGATION_KLUDGE)
  #undef BZ_KCC_COPY_PROPAGATION_KLUDGE
 #endif
 | 
|---|
 | 102 | 
 | 
|---|
 /*
  * _bz_inline1 / _bz_inline2 expand to the `inline` keyword when the
  * matching BZ_INLINE_GROUPn switch is defined, and to nothing otherwise.
  */
 #if !defined(BZ_INLINE_GROUP1)
  #define _bz_inline1
 #else
  #define _bz_inline1 inline
 #endif

 #if !defined(BZ_INLINE_GROUP2)
  #define _bz_inline2
 #else
  #define _bz_inline2 inline
 #endif
 | 
|---|
 | 114 | 
 | 
|---|
 /*
  * DEC cxx: the compiler has problems with loop unrolling because of
  * aliasing, so Blitz++ does the loop unrolling and anti-aliasing itself.
  */
 #if defined(__DECCXX)
   #define  BZ_ARRAY_STACK_TRAVERSAL_UNROLL
   #define  BZ_ARRAY_STACK_TRAVERSAL_CSE_AND_ANTIALIAS
   #define  BZ_PARTIAL_LOOP_UNROLL
 #endif
 | 
|---|
 | 124 | 
 | 
|---|
 /*
  * BZ_NO_PROPAGATE(X) prevents the compiler from performing
  * copy propagation on a variable.  This is used for loop
  * unrolling to prevent KAI C++ from rearranging the
  * ordering of memory accesses.
  *
  * By default the macro expands to its argument unchanged.  Only when
  * both __KCC and BZ_USE_NO_PROPAGATE are defined is it redefined to
  * pass the address of X to __kai_apply.
  */

 #define BZ_NO_PROPAGATE(X)   X

 #if defined(__KCC) && defined(BZ_USE_NO_PROPAGATE)
     extern "C" int __kai_apply(const char*, ...);

     /*
      * #undef takes the bare macro name only; writing a parameter list
      * after it is ill-formed and draws an "extra tokens" diagnostic.
      */
     #undef  BZ_NO_PROPAGATE
     #define BZ_NO_PROPAGATE(X)  __kai_apply("(%a)",&X)
 #endif
 | 
|---|
 | 142 | 
 | 
|---|
 | 143 | #endif // BZ_TUNING_H
 | 
|---|