| [658] | 1 | #ifndef BZ_ARRAYREDUCE_H | 
|---|
|  | 2 | #error <blitz/array/reduce.cc> must be included via <blitz/array/reduce.h> | 
|---|
|  | 3 | #endif | 
|---|
|  | 4 |  | 
|---|
|  | 5 | BZ_NAMESPACE(blitz) | 
|---|
|  | 6 |  | 
|---|
// Forward declaration of the index-traversal full reduction; the definition
// appears further down in this file.  It is declared here so that
// _bz_ArrayExprFullReduce() can call it before it is defined.
template<class T_expr, class T_reduction>
_bz_typename T_reduction::T_resulttype
_bz_reduceWithIndexTraversal(T_expr expr, T_reduction reduction);
|---|
|  | 10 |  | 
|---|
// Forward declaration of the stack-traversal full reduction, with the same
// signature as _bz_reduceWithIndexTraversal().
// NOTE(review): no definition of this function is visible in this file, and
// the only code that would use a stack traversal is disabled under
// NOT_IMPLEMENTED -- confirm a definition exists before calling it.
template<class T_expr, class T_reduction>
_bz_typename T_reduction::T_resulttype
_bz_reduceWithStackTraversal(T_expr expr, T_reduction reduction);
|---|
|  | 14 |  | 
|---|
|  | 15 | template<class T_expr, class T_reduction> | 
|---|
|  | 16 | _bz_typename T_reduction::T_resulttype | 
|---|
|  | 17 | _bz_ArrayExprFullReduce(T_expr expr, T_reduction reduction) | 
|---|
|  | 18 | { | 
|---|
|  | 19 | #ifdef BZ_TAU_PROFILING | 
|---|
|  | 20 | // Tau profiling code.  Provide Tau with a pretty-printed version of | 
|---|
|  | 21 | // the expression. | 
|---|
|  | 22 | static string exprDescription; | 
|---|
|  | 23 | if (!exprDescription.length())      // faked static initializer | 
|---|
|  | 24 | { | 
|---|
|  | 25 | exprDescription = T_reduction::name(); | 
|---|
|  | 26 | exprDescription += "("; | 
|---|
|  | 27 | prettyPrintFormat format(_bz_true);   // Terse mode on | 
|---|
|  | 28 | expr.prettyPrint(exprDescription, format); | 
|---|
|  | 29 | exprDescription += ")"; | 
|---|
|  | 30 | } | 
|---|
|  | 31 | TAU_PROFILE(" ", exprDescription, TAU_BLITZ); | 
|---|
|  | 32 | #endif // BZ_TAU_PROFILING | 
|---|
|  | 33 |  | 
|---|
|  | 34 | return _bz_reduceWithIndexTraversal(expr, reduction); | 
|---|
|  | 35 |  | 
|---|
|  | 36 | #ifdef NOT_IMPLEMENTED | 
|---|
|  | 37 | if ((T_expr::numIndexPlaceholders > 0) || (T_reduction::needIndex)) | 
|---|
|  | 38 | { | 
|---|
|  | 39 | // The expression involves index placeholders, so have to | 
|---|
|  | 40 | // use index traversal rather than stack traversal. | 
|---|
|  | 41 | return reduceWithIndexTraversal(expr, reduction); | 
|---|
|  | 42 | } | 
|---|
|  | 43 | else { | 
|---|
|  | 44 | // Use a stack traversal | 
|---|
|  | 45 | return reduceWithStackTraversal(expr, reduction); | 
|---|
|  | 46 | } | 
|---|
|  | 47 | #endif | 
|---|
|  | 48 | } | 
|---|
|  | 49 |  | 
|---|
|  | 50 | template<class T_expr, class T_reduction> | 
|---|
|  | 51 | _bz_typename T_reduction::T_resulttype | 
|---|
|  | 52 | _bz_reduceWithIndexTraversal(T_expr expr, T_reduction reduction) | 
|---|
|  | 53 | { | 
|---|
|  | 54 | // This is optimized assuming C-style arrays. | 
|---|
|  | 55 |  | 
|---|
|  | 56 | reduction.reset(); | 
|---|
|  | 57 |  | 
|---|
|  | 58 | const int rank = T_expr::rank; | 
|---|
|  | 59 |  | 
|---|
|  | 60 | TinyVector<int,rank> index, first, last; | 
|---|
|  | 61 |  | 
|---|
|  | 62 | unsigned long count = 1; | 
|---|
|  | 63 |  | 
|---|
|  | 64 | for (int i=0; i < rank; ++i) | 
|---|
|  | 65 | { | 
|---|
|  | 66 | index(i) = expr.lbound(i); | 
|---|
|  | 67 | first(i) = index(i); | 
|---|
|  | 68 | last(i) = expr.ubound(i) + 1; | 
|---|
|  | 69 | count *= last(i) - first(i); | 
|---|
|  | 70 | } | 
|---|
|  | 71 |  | 
|---|
|  | 72 | const int maxRank = rank - 1; | 
|---|
|  | 73 | int lastlbound = expr.lbound(maxRank); | 
|---|
|  | 74 | int lastubound = expr.ubound(maxRank); | 
|---|
|  | 75 |  | 
|---|
|  | 76 | int lastIndex = lastubound + 1; | 
|---|
|  | 77 |  | 
|---|
|  | 78 | _bz_bool loopFlag = _bz_true; | 
|---|
|  | 79 |  | 
|---|
|  | 80 | while(loopFlag) { | 
|---|
|  | 81 | for (index[maxRank] = lastlbound; index[maxRank] < lastIndex; | 
|---|
|  | 82 | ++index[maxRank]) | 
|---|
|  | 83 | { | 
|---|
|  | 84 | if (!reduction(expr(index), index[maxRank])) | 
|---|
|  | 85 | { | 
|---|
|  | 86 | loopFlag = _bz_false; | 
|---|
|  | 87 | break; | 
|---|
|  | 88 | } | 
|---|
|  | 89 | } | 
|---|
|  | 90 |  | 
|---|
|  | 91 | #if 0 | 
|---|
|  | 92 | int j = 1; | 
|---|
|  | 93 | for (; j < rank; ++j) | 
|---|
|  | 94 | { | 
|---|
|  | 95 | index(j-1) = first(j-1); | 
|---|
|  | 96 | ++index(j); | 
|---|
|  | 97 | if (index(j) != last(j)) | 
|---|
|  | 98 | break; | 
|---|
|  | 99 | } | 
|---|
|  | 100 |  | 
|---|
|  | 101 | if (j == rank) | 
|---|
|  | 102 | break; | 
|---|
|  | 103 | #endif | 
|---|
|  | 104 |  | 
|---|
|  | 105 | int j = rank-2; | 
|---|
|  | 106 | for (; j >= 0; --j) | 
|---|
|  | 107 | { | 
|---|
|  | 108 | index(j+1) = first(j+1); | 
|---|
|  | 109 | ++index(j); | 
|---|
|  | 110 | if (index(j) != last(j)) | 
|---|
|  | 111 | break; | 
|---|
|  | 112 | } | 
|---|
|  | 113 |  | 
|---|
|  | 114 | if (j < 0) | 
|---|
|  | 115 | break; | 
|---|
|  | 116 | } | 
|---|
|  | 117 |  | 
|---|
|  | 118 | return reduction.result(count); | 
|---|
|  | 119 | } | 
|---|
|  | 120 |  | 
|---|
|  | 121 | BZ_NAMESPACE_END | 
|---|
|  | 122 |  | 
|---|