~vcs-imports/escript-finley/trunk

« back to all changes in this revision

Viewing changes to dudley/src/Assemble_PDE_Single2_3D.c

  • Committer: jfenwick
  • Date: 2010-10-11 01:48:14 UTC
  • Revision ID: svn-v4:77569008-7704-0410-b7a0-a92fef0b09fd:trunk:3259
Merging dudley and scons updates from branches

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
 
 
2
/*******************************************************
 
3
*
 
4
* Copyright (c) 2003-2010 by University of Queensland
 
5
* Earth Systems Science Computational Center (ESSCC)
 
6
* http://www.uq.edu.au/esscc
 
7
*
 
8
* Primary Business: Queensland, Australia
 
9
* Licensed under the Open Software License version 3.0
 
10
* http://www.opensource.org/licenses/osl-3.0.php
 
11
*
 
12
*******************************************************/
 
13
 
 
14
/**************************************************************/
 
15
 
 
16
/*    assembles the system of numEq PDEs into the stiffness matrix S and right hand side F  */
 
17
/*    the shape functions for test and solution must be identical */
 
18
 
 
19
/*      -(A_{i,j} u_,j)_,i - (B_{i} u)_,i + C_{j} u_,j + D u  =  -(X_{i})_,i + Y */
 
20
 
 
21
/*    in a 3D domain. The shape functions for test and solution must be identical  */
 
22
/*    and row_NS == row_NN                                                         */
 
23
 
 
24
/*    Shape of the coefficients: */
 
25
 
 
26
/*      A = 3 x 3 */
 
27
/*      B = 3   */
 
28
/*      C = 3   */
 
29
/*      D = scalar  */
 
30
/*      X = 3  */
 
31
/*      Y = scalar   */
 
32
 
 
33
/**************************************************************/
 
34
 
 
35
#include "Assemble.h"
 
36
#include "Util.h"
 
37
#ifdef _OPENMP
 
38
#include <omp.h>
 
39
#endif
 
40
 
 
41
/**************************************************************/
 
42
 
 
43
void Dudley_Assemble_PDE_Single2_3D(Dudley_Assemble_Parameters p, Dudley_ElementFile * elements,
 
44
                                    Paso_SystemMatrix * Mat, escriptDataC * F,
 
45
                                    escriptDataC * A, escriptDataC * B, escriptDataC * C, escriptDataC * D,
 
46
                                    escriptDataC * X, escriptDataC * Y)
 
47
{
 
48
 
 
49
#define DIM 3
 
50
    index_t color;
 
51
    dim_t e;
 
52
    __const double *A_p, *B_p, *C_p, *D_p, *X_p, *Y_p, *A_q, *B_q, *C_q, *D_q, *X_q, *Y_q;
 
53
    double *EM_S, *EM_F, *DSDX;
 
54
    index_t *row_index;
 
55
    register dim_t q, s, r;
 
56
    register double rtmp, rtmp00, rtmp01, rtmp02, rtmp10, rtmp11, rtmp12, rtmp20, rtmp21, rtmp22, rtmp0, rtmp1, rtmp2;
 
57
    bool_t add_EM_F, add_EM_S;
 
58
 
 
59
    bool_t extendedA = isExpanded(A);
 
60
    bool_t extendedB = isExpanded(B);
 
61
    bool_t extendedC = isExpanded(C);
 
62
    bool_t extendedD = isExpanded(D);
 
63
    bool_t extendedX = isExpanded(X);
 
64
    bool_t extendedY = isExpanded(Y);
 
65
    double *F_p = (requireWrite(F), getSampleDataRW(F, 0));     /* use comma, to get around the mixed code and declarations thing */
 
66
    const double *S = p.shapeFns;
 
67
    dim_t len_EM_S = p.numShapes * p.numShapes;
 
68
    dim_t len_EM_F = p.numShapes;
 
69
 
 
70
#pragma omp parallel private(color,EM_S, EM_F, DSDX, A_p, B_p, C_p, D_p, X_p, Y_p, A_q, B_q, C_q, D_q, X_q, Y_q,row_index,q, s,r,rtmp, rtmp00, rtmp01, rtmp02, rtmp10, rtmp11, rtmp12, rtmp20, rtmp21, rtmp22, rtmp0, rtmp1, rtmp2,add_EM_F, add_EM_S)
 
71
    {
 
72
        EM_S = THREAD_MEMALLOC(len_EM_S, double);
 
73
        EM_F = THREAD_MEMALLOC(len_EM_F, double);
 
74
        row_index = THREAD_MEMALLOC(p.numShapes, index_t);
 
75
 
 
76
        if (!Dudley_checkPtr(EM_S) && !Dudley_checkPtr(EM_F) && !Dudley_checkPtr(row_index))
 
77
        {
 
78
 
 
79
            for (color = elements->minColor; color <= elements->maxColor; color++)
 
80
            {
 
81
                /*  open loop over all elements: */
 
82
#pragma omp for private(e) schedule(static)
 
83
                for (e = 0; e < elements->numElements; e++)
 
84
                {
 
85
                    if (elements->Color[e] == color)
 
86
                    {
 
87
                        double vol = p.row_jac->absD[e] * p.row_jac->quadweight;
 
88
 
 
89
                        A_p = getSampleDataRO(A, e);
 
90
                        B_p = getSampleDataRO(B, e);
 
91
                        C_p = getSampleDataRO(C, e);
 
92
                        D_p = getSampleDataRO(D, e);
 
93
                        X_p = getSampleDataRO(X, e);
 
94
                        Y_p = getSampleDataRO(Y, e);
 
95
 
 
96
                        DSDX = &(p.row_jac->DSDX[INDEX5(0, 0, 0, 0, e, p.numShapes, DIM, p.numQuad, 1)]);
 
97
                        for (q = 0; q < len_EM_S; ++q)
 
98
                            EM_S[q] = 0;
 
99
                        for (q = 0; q < len_EM_F; ++q)
 
100
                            EM_F[q] = 0;
 
101
                        add_EM_F = FALSE;
 
102
                        add_EM_S = FALSE;
 
103
 
 
104
                      /**************************************************************/
 
105
                        /*   process A: */
 
106
                      /**************************************************************/
 
107
                        if (NULL != A_p)
 
108
                        {
 
109
                            add_EM_S = TRUE;
 
110
                            if (extendedA)
 
111
                            {
 
112
                                A_q = &(A_p[INDEX4(0, 0, 0, 0, DIM, DIM, p.numQuad)]);
 
113
                                for (s = 0; s < p.numShapes; s++)
 
114
                                {
 
115
                                    for (r = 0; r < p.numShapes; r++)
 
116
                                    {
 
117
                                        rtmp = 0;
 
118
                                        for (q = 0; q < p.numQuad; q++)
 
119
                                        {
 
120
                                            rtmp +=
 
121
                                                vol * (DSDX[INDEX3(s, 0, q, p.numShapes, DIM)] *
 
122
                                                       A_q[INDEX3(0, 0, q, DIM, DIM)] *
 
123
                                                       DSDX[INDEX3(r, 0, q, p.numShapes, DIM)] +
 
124
                                                       DSDX[INDEX3(s, 0, q, p.numShapes, DIM)] *
 
125
                                                       A_q[INDEX3(0, 1, q, DIM, DIM)] *
 
126
                                                       DSDX[INDEX3(r, 1, q, p.numShapes, DIM)] +
 
127
                                                       DSDX[INDEX3(s, 0, q, p.numShapes, DIM)] *
 
128
                                                       A_q[INDEX3(0, 2, q, DIM, DIM)] *
 
129
                                                       DSDX[INDEX3(r, 2, q, p.numShapes, DIM)] +
 
130
                                                       DSDX[INDEX3(s, 1, q, p.numShapes, DIM)] *
 
131
                                                       A_q[INDEX3(1, 0, q, DIM, DIM)] *
 
132
                                                       DSDX[INDEX3(r, 0, q, p.numShapes, DIM)] +
 
133
                                                       DSDX[INDEX3(s, 1, q, p.numShapes, DIM)] *
 
134
                                                       A_q[INDEX3(1, 1, q, DIM, DIM)] *
 
135
                                                       DSDX[INDEX3(r, 1, q, p.numShapes, DIM)] +
 
136
                                                       DSDX[INDEX3(s, 1, q, p.numShapes, DIM)] *
 
137
                                                       A_q[INDEX3(1, 2, q, DIM, DIM)] *
 
138
                                                       DSDX[INDEX3(r, 2, q, p.numShapes, DIM)] +
 
139
                                                       DSDX[INDEX3(s, 2, q, p.numShapes, DIM)] *
 
140
                                                       A_q[INDEX3(2, 0, q, DIM, DIM)] *
 
141
                                                       DSDX[INDEX3(r, 0, q, p.numShapes, DIM)] +
 
142
                                                       DSDX[INDEX3(s, 2, q, p.numShapes, DIM)] *
 
143
                                                       A_q[INDEX3(2, 1, q, DIM, DIM)] *
 
144
                                                       DSDX[INDEX3(r, 1, q, p.numShapes, DIM)] +
 
145
                                                       DSDX[INDEX3(s, 2, q, p.numShapes, DIM)] *
 
146
                                                       A_q[INDEX3(2, 2, q, DIM, DIM)] *
 
147
                                                       DSDX[INDEX3(r, 2, q, p.numShapes, DIM)]);
 
148
                                        }
 
149
                                        EM_S[INDEX4(0, 0, s, r, p.numEqu, p.numComp, p.numShapes)] += rtmp;
 
150
                                    }
 
151
                                }
 
152
                            }
 
153
                            else
 
154
                            {
 
155
                                for (s = 0; s < p.numShapes; s++)
 
156
                                {
 
157
                                    for (r = 0; r < p.numShapes; r++)
 
158
                                    {
 
159
                                        rtmp00 = 0;
 
160
                                        rtmp01 = 0;
 
161
                                        rtmp02 = 0;
 
162
                                        rtmp10 = 0;
 
163
                                        rtmp11 = 0;
 
164
                                        rtmp12 = 0;
 
165
                                        rtmp20 = 0;
 
166
                                        rtmp21 = 0;
 
167
                                        rtmp22 = 0;
 
168
                                        for (q = 0; q < p.numQuad; q++)
 
169
                                        {
 
170
 
 
171
                                            rtmp0 = vol * DSDX[INDEX3(s, 0, q, p.numShapes, DIM)];
 
172
                                            rtmp00 += rtmp0 * DSDX[INDEX3(r, 0, q, p.numShapes, DIM)];
 
173
                                            rtmp01 += rtmp0 * DSDX[INDEX3(r, 1, q, p.numShapes, DIM)];
 
174
                                            rtmp02 += rtmp0 * DSDX[INDEX3(r, 2, q, p.numShapes, DIM)];
 
175
 
 
176
                                            rtmp1 = vol * DSDX[INDEX3(s, 1, q, p.numShapes, DIM)];
 
177
                                            rtmp10 += rtmp1 * DSDX[INDEX3(r, 0, q, p.numShapes, DIM)];
 
178
                                            rtmp11 += rtmp1 * DSDX[INDEX3(r, 1, q, p.numShapes, DIM)];
 
179
                                            rtmp12 += rtmp1 * DSDX[INDEX3(r, 2, q, p.numShapes, DIM)];
 
180
 
 
181
                                            rtmp2 = vol * DSDX[INDEX3(s, 2, q, p.numShapes, DIM)];
 
182
                                            rtmp20 += rtmp2 * DSDX[INDEX3(r, 0, q, p.numShapes, DIM)];
 
183
                                            rtmp21 += rtmp2 * DSDX[INDEX3(r, 1, q, p.numShapes, DIM)];
 
184
                                            rtmp22 += rtmp2 * DSDX[INDEX3(r, 2, q, p.numShapes, DIM)];
 
185
                                        }
 
186
                                        EM_S[INDEX4(0, 0, s, r, p.numEqu, p.numComp, p.numShapes)] +=
 
187
                                            rtmp00 * A_p[INDEX2(0, 0, DIM)] + rtmp01 * A_p[INDEX2(0, 1, DIM)] +
 
188
                                            rtmp02 * A_p[INDEX2(0, 2, DIM)] + rtmp10 * A_p[INDEX2(1, 0, DIM)] +
 
189
                                            rtmp11 * A_p[INDEX2(1, 1, DIM)] + rtmp12 * A_p[INDEX2(1, 2, DIM)] +
 
190
                                            rtmp20 * A_p[INDEX2(2, 0, DIM)] + rtmp21 * A_p[INDEX2(2, 1, DIM)] +
 
191
                                            rtmp22 * A_p[INDEX2(2, 2, DIM)];
 
192
                                    }
 
193
                                }
 
194
                            }
 
195
                        }
 
196
                      /**************************************************************/
 
197
                        /*   process B: */
 
198
                      /**************************************************************/
 
199
                        if (NULL != B_p)
 
200
                        {
 
201
                            add_EM_S = TRUE;
 
202
                            if (extendedB)
 
203
                            {
 
204
                                B_q = &(B_p[INDEX3(0, 0, 0, DIM, p.numQuad)]);
 
205
                                for (s = 0; s < p.numShapes; s++)
 
206
                                {
 
207
                                    for (r = 0; r < p.numShapes; r++)
 
208
                                    {
 
209
                                        rtmp = 0;
 
210
                                        for (q = 0; q < p.numQuad; q++)
 
211
                                        {
 
212
                                            rtmp += vol * S[INDEX2(r, q, p.numShapes)] *
 
213
                                                (DSDX[INDEX3(s, 0, q, p.numShapes, DIM)] *
 
214
                                                 B_q[INDEX2(0, q, DIM)] +
 
215
                                                 DSDX[INDEX3(s, 1, q, p.numShapes, DIM)] *
 
216
                                                 B_q[INDEX2(1, q, DIM)] +
 
217
                                                 DSDX[INDEX3(s, 2, q, p.numShapes, DIM)] * B_q[INDEX2(2, q, DIM)]);
 
218
                                        }
 
219
                                        EM_S[INDEX4(0, 0, s, r, p.numEqu, p.numComp, p.numShapes)] += rtmp;
 
220
                                    }
 
221
                                }
 
222
                            }
 
223
                            else
 
224
                            {
 
225
                                for (s = 0; s < p.numShapes; s++)
 
226
                                {
 
227
                                    for (r = 0; r < p.numShapes; r++)
 
228
                                    {
 
229
                                        rtmp0 = 0;
 
230
                                        rtmp1 = 0;
 
231
                                        rtmp2 = 0;
 
232
                                        for (q = 0; q < p.numQuad; q++)
 
233
                                        {
 
234
                                            rtmp = vol * S[INDEX2(r, q, p.numShapes)];
 
235
                                            rtmp0 += rtmp * DSDX[INDEX3(s, 0, q, p.numShapes, DIM)];
 
236
                                            rtmp1 += rtmp * DSDX[INDEX3(s, 1, q, p.numShapes, DIM)];
 
237
                                            rtmp2 += rtmp * DSDX[INDEX3(s, 2, q, p.numShapes, DIM)];
 
238
                                        }
 
239
                                        EM_S[INDEX4(0, 0, s, r, p.numEqu, p.numComp, p.numShapes)] +=
 
240
                                            rtmp0 * B_p[0] + rtmp1 * B_p[1] + rtmp2 * B_p[2];
 
241
                                    }
 
242
                                }
 
243
                            }
 
244
                        }
 
245
                      /**************************************************************/
 
246
                        /*   process C: */
 
247
                      /**************************************************************/
 
248
                        if (NULL != C_p)
 
249
                        {
 
250
                            add_EM_S = TRUE;
 
251
                            if (extendedC)
 
252
                            {
 
253
                                C_q = &(C_p[INDEX3(0, 0, 0, DIM, p.numQuad)]);
 
254
                                for (s = 0; s < p.numShapes; s++)
 
255
                                {
 
256
                                    for (r = 0; r < p.numShapes; r++)
 
257
                                    {
 
258
                                        rtmp = 0;
 
259
                                        for (q = 0; q < p.numQuad; q++)
 
260
                                        {
 
261
                                            rtmp += vol * S[INDEX2(s, q, p.numShapes)] *
 
262
                                                (C_q[INDEX2(0, q, DIM)] *
 
263
                                                 DSDX[INDEX3(r, 0, q, p.numShapes, DIM)] +
 
264
                                                 C_q[INDEX2(1, q, DIM)] *
 
265
                                                 DSDX[INDEX3(r, 1, q, p.numShapes, DIM)] +
 
266
                                                 C_q[INDEX2(2, q, DIM)] * DSDX[INDEX3(r, 2, q, p.numShapes, DIM)]);
 
267
                                        }
 
268
                                        EM_S[INDEX4(0, 0, s, r, p.numEqu, p.numComp, p.numShapes)] += rtmp;
 
269
                                    }
 
270
                                }
 
271
                            }
 
272
                            else
 
273
                            {
 
274
                                for (s = 0; s < p.numShapes; s++)
 
275
                                {
 
276
                                    for (r = 0; r < p.numShapes; r++)
 
277
                                    {
 
278
                                        rtmp0 = 0;
 
279
                                        rtmp1 = 0;
 
280
                                        rtmp2 = 0;
 
281
                                        for (q = 0; q < p.numQuad; q++)
 
282
                                        {
 
283
                                            rtmp = vol * S[INDEX2(s, q, p.numShapes)];
 
284
                                            rtmp0 += rtmp * DSDX[INDEX3(r, 0, q, p.numShapes, DIM)];
 
285
                                            rtmp1 += rtmp * DSDX[INDEX3(r, 1, q, p.numShapes, DIM)];
 
286
                                            rtmp2 += rtmp * DSDX[INDEX3(r, 2, q, p.numShapes, DIM)];
 
287
                                        }
 
288
                                        EM_S[INDEX4(0, 0, s, r, p.numEqu, p.numComp, p.numShapes)] +=
 
289
                                            rtmp0 * C_p[0] + rtmp1 * C_p[1] + rtmp2 * C_p[2];
 
290
                                    }
 
291
                                }
 
292
                            }
 
293
                        }
 
294
                      /************************************************************* */
 
295
                        /* process D */
 
296
                      /**************************************************************/
 
297
                        if (NULL != D_p)
 
298
                        {
 
299
                            add_EM_S = TRUE;
 
300
                            if (extendedD)
 
301
                            {
 
302
                                D_q = &(D_p[INDEX2(0, 0, p.numQuad)]);
 
303
                                for (s = 0; s < p.numShapes; s++)
 
304
                                {
 
305
                                    for (r = 0; r < p.numShapes; r++)
 
306
                                    {
 
307
                                        rtmp = 0;
 
308
                                        for (q = 0; q < p.numQuad; q++)
 
309
                                            rtmp +=
 
310
                                                vol * S[INDEX2(s, q, p.numShapes)] * D_q[q] *
 
311
                                                S[INDEX2(r, q, p.numShapes)];
 
312
                                        EM_S[INDEX4(0, 0, s, r, p.numEqu, p.numComp, p.numShapes)] += rtmp;
 
313
                                    }
 
314
                                }
 
315
                            }
 
316
                            else
 
317
                            {
 
318
                                for (s = 0; s < p.numShapes; s++)
 
319
                                {
 
320
                                    for (r = 0; r < p.numShapes; r++)
 
321
                                    {
 
322
                                        rtmp = 0;
 
323
                                        for (q = 0; q < p.numQuad; q++)
 
324
                                            rtmp += vol * S[INDEX2(s, q, p.numShapes)] * S[INDEX2(r, q, p.numShapes)];
 
325
                                        EM_S[INDEX4(0, 0, s, r, p.numEqu, p.numComp, p.numShapes)] += rtmp * D_p[0];
 
326
                                    }
 
327
                                }
 
328
                            }
 
329
                        }
 
330
                      /**************************************************************/
 
331
                        /*   process X: */
 
332
                      /**************************************************************/
 
333
                        if (NULL != X_p)
 
334
                        {
 
335
                            add_EM_F = TRUE;
 
336
                            if (extendedX)
 
337
                            {
 
338
                                X_q = &(X_p[INDEX3(0, 0, 0, DIM, p.numQuad)]);
 
339
                                for (s = 0; s < p.numShapes; s++)
 
340
                                {
 
341
                                    rtmp = 0;
 
342
                                    for (q = 0; q < p.numQuad; q++)
 
343
                                    {
 
344
                                        rtmp +=
 
345
                                            vol * (DSDX[INDEX3(s, 0, q, p.numShapes, DIM)] *
 
346
                                                   X_q[INDEX2(0, q, DIM)] +
 
347
                                                   DSDX[INDEX3(s, 1, q, p.numShapes, DIM)] *
 
348
                                                   X_q[INDEX2(1, q, DIM)] +
 
349
                                                   DSDX[INDEX3(s, 2, q, p.numShapes, DIM)] * X_q[INDEX2(2, q, DIM)]);
 
350
                                    }
 
351
                                    EM_F[INDEX2(0, s, p.numEqu)] += rtmp;
 
352
                                }
 
353
                            }
 
354
                            else
 
355
                            {
 
356
                                for (s = 0; s < p.numShapes; s++)
 
357
                                {
 
358
                                    rtmp0 = 0;
 
359
                                    rtmp1 = 0;
 
360
                                    rtmp2 = 0;
 
361
                                    for (q = 0; q < p.numQuad; q++)
 
362
                                    {
 
363
                                        rtmp0 += vol * DSDX[INDEX3(s, 0, q, p.numShapes, DIM)];
 
364
                                        rtmp1 += vol * DSDX[INDEX3(s, 1, q, p.numShapes, DIM)];
 
365
                                        rtmp2 += vol * DSDX[INDEX3(s, 2, q, p.numShapes, DIM)];
 
366
                                    }
 
367
                                    EM_F[INDEX2(0, s, p.numEqu)] += rtmp0 * X_p[0] + rtmp1 * X_p[1] + rtmp2 * X_p[2];
 
368
                                }
 
369
                            }
 
370
                        }
 
371
                     /**************************************************************/
 
372
                        /*   process Y: */
 
373
                     /**************************************************************/
 
374
                        if (NULL != Y_p)
 
375
                        {
 
376
                            add_EM_F = TRUE;
 
377
                            if (extendedY)
 
378
                            {
 
379
                                Y_q = &(Y_p[INDEX2(0, 0, p.numQuad)]);
 
380
                                for (s = 0; s < p.numShapes; s++)
 
381
                                {
 
382
                                    rtmp = 0;
 
383
                                    for (q = 0; q < p.numQuad; q++)
 
384
                                        rtmp += vol * S[INDEX2(s, q, p.numShapes)] * Y_q[q];
 
385
                                    EM_F[INDEX2(0, s, p.numEqu)] += rtmp;
 
386
                                }
 
387
                            }
 
388
                            else
 
389
                            {
 
390
                                for (s = 0; s < p.numShapes; s++)
 
391
                                {
 
392
                                    rtmp = 0;
 
393
                                    for (q = 0; q < p.numQuad; q++)
 
394
                                        rtmp += vol * S[INDEX2(s, q, p.numShapes)];
 
395
                                    EM_F[INDEX2(0, s, p.numEqu)] += rtmp * Y_p[0];
 
396
                                }
 
397
                            }
 
398
                        }
 
399
                       /***********************************************************************************************/
 
400
                        /* add the element matrices onto the matrix and right hand side                                */
 
401
                       /***********************************************************************************************/
 
402
 
 
403
                        for (q = 0; q < p.numShapes; q++)
 
404
                            row_index[q] = p.row_DOF[elements->Nodes[INDEX2(q, e, p.NN)]];
 
405
 
 
406
                        if (add_EM_F)
 
407
                            Dudley_Util_AddScatter(p.numShapes, row_index, p.numEqu, EM_F, F_p, p.row_DOF_UpperBound);
 
408
                        if (add_EM_S)
 
409
                            Dudley_Assemble_addToSystemMatrix(Mat, p.numShapes, row_index, p.numEqu,
 
410
                                                              p.numShapes, row_index, p.numComp, EM_S);
 
411
 
 
412
                    }           /* end color check */
 
413
                }               /* end element loop */
 
414
            }                   /* end color loop */
 
415
 
 
416
            THREAD_MEMFREE(EM_S);
 
417
            THREAD_MEMFREE(EM_F);
 
418
            THREAD_MEMFREE(row_index);
 
419
 
 
420
        }                       /* end of pointer check */
 
421
    }                           /* end parallel region */
 
422
}