source: Sophya/trunk/SophyaProg/Tests/tparlex.cc@ 3826

Last change on this file since 3826 was 3730, checked in by cmv, 16 years ago

strcmp a besoin de <string.h>, cmv 06/01/2020

File size: 7.1 KB
RevLine 
[3721]1#include <stdlib.h>
2#include <stdio.h>
[3730]3#include <string.h>
[3721]4#include <time.h>
5#include <unistd.h>
6
7#include <iostream>
8#include <vector>
9
10#include "sopnamsp.h"
11#include "tmatrix.h"
12#include "tvector.h"
13#include "matharr.h"
14#include "tarrinit.h"
15#include "randr48.h"
16
17#include "parlex.h"
18#include "resusage.h"
19#include "timing.h"
20#include "ctimer.h"
21
22
23/* -------------------------------------------------------------
24 Programme de test des classes d'execution parallele de SOPHYA
25 SOPHYA::ParallelExecutor ...
26 Exemples d'execution:
27 Usage: tparlex SEL [Size=500] [NThreads=2] [NbExecuteCall=1]
28 csh> time tparlex A 2000 2
29 csh> time tparlex B 500 2
30 csh> time tparlex A 2000 2 4
31 csh> time tparlex B 500 2 3
32*/
33
34// Declaration des fonctions de test
35int parex_testA();
36int parex_testB();
37
38
39static sa_size_t SIZE = 500;
40static unsigned int NTHR = 2;
41static unsigned int NBPEXC = 1;
42
43//--------------------------------------------------------------
44//---------------------- MAIN PROGRAM ------------------------
45int main(int narg, char *arg[])
46{
47
48 if ((narg<2)||((narg > 1)&&(strcmp(arg[1],"-h")==0))) {
49 cout << " tparlex Test of SOPHYA parallel execution classes \n"
50 << " Usage: tparlex SEL [Size=500] [NThreads=2] [NbExecuteCall=1] \n"
51 << " - SEL : A or B \n "
52 << " - Size : Matrix size (see below) \n "
53 << " - NThreads : number of threads \n "
54 << " - NbExecuteCall : number of call to parallel execution function \n "
55 << " A -> Sin(mx)+Sqrt(mx)+Cos(mx) , mx(NThr,1000*Size) \n"
56 << " B -> mxa(NThr*Size, Size) * mxb(Size,Size) " << endl;
57 return(1);
58 }
59 InitTim();
60 ResourceUsage res(ResourceUsage::RU_All);
61
62 char sel = *arg[1];
63 if (narg > 2) SIZE = atol(arg[2]);
64 if (narg > 3) NTHR = atoi(arg[3]);
65 if (narg > 4) NBPEXC = atoi(arg[4]);
66 if (SIZE<100) SIZE=100;
67 if (NTHR<1) NTHR=1;
68 if (NBPEXC<1) NBPEXC=1;
69
70 cout << " tparlex/starting, SEL=" << sel << " Size=" << SIZE << " NTHR=NRows=" << NTHR
71 << " NbParExCall=" << NBPEXC << endl;
72 BaseArray::SetDefaultMemoryMapping(BaseArray::CMemoryMapping);
73
74 int rc = 0;
75 try {
76 ResourceUsage res(ResourceUsage::RU_All);
77 if (sel=='A') rc = parex_testA();
78 else rc = parex_testB();
79 cout << res;
80 }
81 catch (std::exception exc) {
82 cerr << "tparlex: catched std::exception " << exc.what() << endl;
83 rc = 77;
84 }
85 catch (...) {
86 cerr << "tparlex: catched unknown (...) exception " << endl;
87 rc = 78;
88 }
89
90 PrtTim(">>> tparlex: END <<< ");
91 cout << " ------------ End execution tparlex -------------- " << endl;
92 return(rc);
93}
94
95
96//--------------------------------------------------------------------
97// Classe implementant la fonction d'execution parallele
98// ParallelTaskInterface::execute() mxb=sin(mxa)+sqrt(mxa)+cos(mxa)
99class TParTaskA : public ParallelTaskInterface {
100public:
101 TParTaskA(Matrix& a, Matrix& b)
102 : mxa(a), mxb(b), nbex(0)
103 {
104 }
105 virtual int execute(int tid)
106 {
107 nbex++;
108 cout << " ---- TParTaskA::execute(tid=" << tid << ") Start computing - NbExec= " << nbex << endl;
109 Vector vx = mxa.Row(tid);
110 r_8* x = vx.Data();
111 r_8* y = mxb.Row(tid).Data();
112 for(sa_size_t j=0; j<vx.Size(); j++)
113 y[j] = sin(x[j])+sqrt(x[j])+cos(x[j]);
114 // mxb.Row(tid) = Sin(x)+Sqrt(x)+Cos(x);
115 cout << " ---- TParTaskA::execute( " << tid << "," << nbex << ") DONE " << endl;
116 return 0;
117 }
118
119 Matrix& mxa;
120 Matrix& mxb;
121 int nbex;
122};
123
124/* --Fonction-- */
125int parex_testA()
126{
127 sa_size_t NCOLS = SIZE*1000;
128 Matrix a(NTHR, NCOLS);
129 Matrix b(NTHR, NCOLS);
130 Matrix c(NTHR, NCOLS);
131
132 cout << " parex_testA/Info: " << a.InfoString() << endl;
133 a = RegularSequence(0.25,0.003);
134 PrtTim("tparlexA[1] Done init ");
135 cout << "tparlexA[1] Start b=Sin(a)+Sqrt(a)+Cos[a]" << endl;
136 r_8* x = a.Data();
137 r_8* y = b.Data();
138 for(sa_size_t j=0; j<a.Size(); j++)
139 y[j] = sin(x[j])+sqrt(x[j])+cos(x[j]);
140 // b = Sin(a)+Sqrt(a)+Cos(a);
141 PrtTim(">>tparlexA[1.b] Done ");
142 // char ans[64];
143 // cout << " A/ CR to continue ... " << endl; gets(ans);
144
145 TParTaskA ptask(a,c);
146 ParallelExecutor pex(ptask, NTHR);
147 pex.start();
148 int rce=0;
149 for(int i=0; i<NBPEXC; i++) {
150 cout << " tparlexA[II=" << i+1 << " Start ParallelExecution c=Sin(a)+Sqrt(a)+Cos[a]" << endl;
151 rce = pex.execute();
152 PrtTim(">>>>tparlexA: End ParallelExecution ");
153 }
154 cout << " Rc=pex.execute() = " << rce << endl;
155 Matrix d = b-c;
156 double dmin, dmax;
157 d.MinMax(dmin, dmax);
158 cout << ">>tparlexA[3] Diff d=b-c, dmin=" << dmin << " dmax=" << dmax << endl;
159 // cout << " B/ CR to continue ... " << endl; gets(ans);
160
161 // cout << " C/ CR to continue ... " << endl; gets(ans);
162 return 0;
163}
164
165
166//--------------------------------------------------------------------
167// Classe implementant la fonction d'execution parallele
168// ParallelTaskInterface::execute() mxc= mxa * mxb
169class TParTaskB : public ParallelTaskInterface {
170public:
171 TParTaskB(Matrix& a, Matrix& b, Matrix& c, int nth)
[3730]172 : mxa(a), mxb(b), mxc(c), nthread(nth), nbex(0)
[3721]173 {
174 }
175 virtual int execute(int tid)
176 {
177 nbex++;
178 cout << " ---- TParTaskB::execute(tid=" << tid << ") Start computing - NbExec= " << nbex << endl;
179 sa_size_t sz = mxb.NRows();
180 // On s'arrange pour que chaque thread calcule une partie de la matrice resultat
181 // Il faut etre un peu malin et eviter que differents threads accedent les memes zones memoire
182 mxc.SubMatrix(Range(sz*tid, sz*(tid+1)-1), Range::all() ) =
183 mxa.SubMatrix(Range(sz*tid, sz*(tid+1)-1), Range::all()) * mxb;
184 /* Une maniere plus compliquee pour MxA(NTH*SZ , SZ) * MxB(SZ, NTH*SZ)
185 mais cela n'apporte rien ...
186 for(sa_size_t j=0; j<nthread; j++) {
187 sa_size_t jj = (j+tid)%nthread;
188 mxc.SubMatrix(Range(sz*tid, sz*(tid+1)-1), Range(sz*jj, sz*(jj+1)-1)) =
189 mxa.SubMatrix(Range(sz*tid, sz*(tid+1)-1), Range::all()) *
190 mxb.SubMatrix(Range::all(), Range(sz*jj, sz*(jj+1)-1));
191 }
192 */
193 cout << " ---- TParTaskB::execute( " << tid << "," << nbex << ") DONE " << endl;
194 return 0;
195 }
196
197 Matrix& mxa;
198 Matrix& mxb;
199 Matrix& mxc;
200 int nthread;
201 int nbex;
202};
203
204/* --Fonction-- */
205int parex_testB()
206{
207 // On se met dans les conditions optimales pour la multiplication matricielle
208 Matrix a(NTHR*SIZE, SIZE, BaseArray::CMemoryMapping);
209 Matrix b(SIZE, SIZE, BaseArray::FortranMemoryMapping);
210 Matrix c(NTHR*SIZE, SIZE);
211
212 cout << " parex_testB/Info: a.InfoString(): " << a.InfoString() << endl;
213 cout << " parex_testB/Info: b.InfoString(): " << b.InfoString() << endl;
214
215 a = RegularSequence(0.25,0.003);
216 b = RegularSequence(1.2,0.0423);
217
218 PrtTim("tparlexA[1] Done init ");
219
220 cout << "tparlexB[1] Start cc=a*b" << endl;
221 // Matrix cc(NTHR*SIZE, SIZE);
222 // cc = a*b;
223 Matrix cc = a*b;
224 PrtTim(">>tparlexB[1.b] Done ");
225
226 TParTaskB ptask(a,b,c,NTHR);
227 ParallelExecutor pex(ptask, NTHR);
228 pex.start();
229 int rce=0;
230 for(int i=0; i<NBPEXC; i++) {
231 cout << " tparlexB[II=" << i+1 << " Start ParallelExecution c=a*b" << endl;
232 rce = pex.execute();
233 PrtTim(">>tparlexB: End ParallelExecution ");
234 }
235 cout << " Rc=pex.execute() = " << rce << endl;
236 Matrix d = cc-c;
237 double dmin, dmax;
238 d.MinMax(dmin, dmax);
239 cout << ">>tparlexB[3] Diff d=b-c, dmin=" << dmin << " dmax=" << dmax << endl;
240 return 0;
241}
Note: See TracBrowser for help on using the repository browser.