543 lines
15 KiB
C
543 lines
15 KiB
C
/*BHEADER**********************************************************************
|
|
* Copyright (c) 2007, Lawrence Livermore National Security, LLC.
|
|
* Produced at the Lawrence Livermore National Laboratory.
|
|
* Written by the HYPRE team. UCRL-CODE-222953.
|
|
* All rights reserved.
|
|
*
|
|
* This file is part of HYPRE (see http://www.llnl.gov/CASC/hypre/).
|
|
* Please see the COPYRIGHT_and_LICENSE file for the copyright notice,
|
|
* disclaimer, contact information and the GNU Lesser General Public License.
|
|
*
|
|
* HYPRE is free software; you can redistribute it and/or modify it under the
|
|
* terms of the GNU General Public License (as published by the Free Software
|
|
* Foundation) version 2.1 dated February 1999.
|
|
*
|
|
* HYPRE is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
* WARRANTY; without even the IMPLIED WARRANTY OF MERCHANTABILITY or FITNESS
|
|
* FOR A PARTICULAR PURPOSE. See the terms and conditions of the GNU General
|
|
* Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public License
|
|
* along with this program; if not, write to the Free Software Foundation,
|
|
* Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
*
|
|
* $Revision$
|
|
***********************************************************************EHEADER*/
|
|
|
|
|
|
|
|
|
|
|
|
#include "headers.h"
|
|
|
|
/*--------------------------------------------------------------------------
|
|
* hypre_GenerateVarDifConv
|
|
*--------------------------------------------------------------------------*/
|
|
|
|
HYPRE_ParCSRMatrix
|
|
GenerateVarDifConv( MPI_Comm comm,
|
|
int nx,
|
|
int ny,
|
|
int nz,
|
|
int P,
|
|
int Q,
|
|
int R,
|
|
int p,
|
|
int q,
|
|
int r,
|
|
double eps,
|
|
HYPRE_ParVector *rhs_ptr)
|
|
{
|
|
hypre_ParCSRMatrix *A;
|
|
hypre_CSRMatrix *diag;
|
|
hypre_CSRMatrix *offd;
|
|
hypre_ParVector *par_rhs;
|
|
hypre_Vector *rhs;
|
|
double *rhs_data;
|
|
|
|
int *diag_i;
|
|
int *diag_j;
|
|
double *diag_data;
|
|
|
|
int *offd_i;
|
|
int *offd_j;
|
|
double *offd_data;
|
|
|
|
int *global_part;
|
|
int ix, iy, iz;
|
|
int cnt, o_cnt;
|
|
int local_num_rows;
|
|
int *col_map_offd;
|
|
int row_index;
|
|
int i,j;
|
|
|
|
int nx_local, ny_local, nz_local;
|
|
int nx_size, ny_size, nz_size;
|
|
int num_cols_offd;
|
|
int grid_size;
|
|
|
|
int *nx_part;
|
|
int *ny_part;
|
|
int *nz_part;
|
|
|
|
int num_procs, my_id;
|
|
int P_busy, Q_busy, R_busy;
|
|
|
|
double hhx, hhy, hhz;
|
|
double xx, yy, zz;
|
|
double afp, afm, bfp, bfm, cfp, cfm, df, ef, ff, gf;
|
|
|
|
MPI_Comm_size(comm,&num_procs);
|
|
MPI_Comm_rank(comm,&my_id);
|
|
|
|
grid_size = nx*ny*nz;
|
|
|
|
hypre_GeneratePartitioning(nx,P,&nx_part);
|
|
hypre_GeneratePartitioning(ny,Q,&ny_part);
|
|
hypre_GeneratePartitioning(nz,R,&nz_part);
|
|
|
|
global_part = hypre_CTAlloc(int,P*Q*R+1);
|
|
|
|
global_part[0] = 0;
|
|
cnt = 1;
|
|
for (iz = 0; iz < R; iz++)
|
|
{
|
|
nz_size = nz_part[iz+1]-nz_part[iz];
|
|
for (iy = 0; iy < Q; iy++)
|
|
{
|
|
ny_size = ny_part[iy+1]-ny_part[iy];
|
|
for (ix = 0; ix < P; ix++)
|
|
{
|
|
nx_size = nx_part[ix+1] - nx_part[ix];
|
|
global_part[cnt] = global_part[cnt-1];
|
|
global_part[cnt++] += nx_size*ny_size*nz_size;
|
|
}
|
|
}
|
|
}
|
|
|
|
nx_local = nx_part[p+1] - nx_part[p];
|
|
ny_local = ny_part[q+1] - ny_part[q];
|
|
nz_local = nz_part[r+1] - nz_part[r];
|
|
|
|
my_id = r*(P*Q) + q*P + p;
|
|
num_procs = P*Q*R;
|
|
|
|
local_num_rows = nx_local*ny_local*nz_local;
|
|
diag_i = hypre_CTAlloc(int, local_num_rows+1);
|
|
offd_i = hypre_CTAlloc(int, local_num_rows+1);
|
|
rhs_data = hypre_CTAlloc(double, local_num_rows);
|
|
|
|
P_busy = hypre_min(nx,P);
|
|
Q_busy = hypre_min(ny,Q);
|
|
R_busy = hypre_min(nz,R);
|
|
|
|
num_cols_offd = 0;
|
|
if (p) num_cols_offd += ny_local*nz_local;
|
|
if (p < P_busy-1) num_cols_offd += ny_local*nz_local;
|
|
if (q) num_cols_offd += nx_local*nz_local;
|
|
if (q < Q_busy-1) num_cols_offd += nx_local*nz_local;
|
|
if (r) num_cols_offd += nx_local*ny_local;
|
|
if (r < R_busy-1) num_cols_offd += nx_local*ny_local;
|
|
|
|
if (!local_num_rows) num_cols_offd = 0;
|
|
|
|
col_map_offd = hypre_CTAlloc(int, num_cols_offd);
|
|
|
|
hhx = 1.0/(double)(nx+1);
|
|
hhy = 1.0/(double)(ny+1);
|
|
hhz = 1.0/(double)(nz+1);
|
|
|
|
cnt = 1;
|
|
o_cnt = 1;
|
|
diag_i[0] = 0;
|
|
offd_i[0] = 0;
|
|
for (iz = nz_part[r]; iz < nz_part[r+1]; iz++)
|
|
{
|
|
for (iy = ny_part[q]; iy < ny_part[q+1]; iy++)
|
|
{
|
|
for (ix = nx_part[p]; ix < nx_part[p+1]; ix++)
|
|
{
|
|
diag_i[cnt] = diag_i[cnt-1];
|
|
offd_i[o_cnt] = offd_i[o_cnt-1];
|
|
diag_i[cnt]++;
|
|
if (iz > nz_part[r])
|
|
diag_i[cnt]++;
|
|
else
|
|
{
|
|
if (iz)
|
|
{
|
|
offd_i[o_cnt]++;
|
|
}
|
|
}
|
|
if (iy > ny_part[q])
|
|
diag_i[cnt]++;
|
|
else
|
|
{
|
|
if (iy)
|
|
{
|
|
offd_i[o_cnt]++;
|
|
}
|
|
}
|
|
if (ix > nx_part[p])
|
|
diag_i[cnt]++;
|
|
else
|
|
{
|
|
if (ix)
|
|
{
|
|
offd_i[o_cnt]++;
|
|
}
|
|
}
|
|
if (ix+1 < nx_part[p+1])
|
|
diag_i[cnt]++;
|
|
else
|
|
{
|
|
if (ix+1 < nx)
|
|
{
|
|
offd_i[o_cnt]++;
|
|
}
|
|
}
|
|
if (iy+1 < ny_part[q+1])
|
|
diag_i[cnt]++;
|
|
else
|
|
{
|
|
if (iy+1 < ny)
|
|
{
|
|
offd_i[o_cnt]++;
|
|
}
|
|
}
|
|
if (iz+1 < nz_part[r+1])
|
|
diag_i[cnt]++;
|
|
else
|
|
{
|
|
if (iz+1 < nz)
|
|
{
|
|
offd_i[o_cnt]++;
|
|
}
|
|
}
|
|
cnt++;
|
|
o_cnt++;
|
|
}
|
|
}
|
|
}
|
|
|
|
diag_j = hypre_CTAlloc(int, diag_i[local_num_rows]);
|
|
diag_data = hypre_CTAlloc(double, diag_i[local_num_rows]);
|
|
|
|
if (num_procs > 1)
|
|
{
|
|
offd_j = hypre_CTAlloc(int, offd_i[local_num_rows]);
|
|
offd_data = hypre_CTAlloc(double, offd_i[local_num_rows]);
|
|
}
|
|
|
|
row_index = 0;
|
|
cnt = 0;
|
|
o_cnt = 0;
|
|
for (iz = nz_part[r]; iz < nz_part[r+1]; iz++)
|
|
{
|
|
zz = (double)(iz+1)*hhz;
|
|
for (iy = ny_part[q]; iy < ny_part[q+1]; iy++)
|
|
{
|
|
yy = (double)(iy+1)*hhy;
|
|
for (ix = nx_part[p]; ix < nx_part[p+1]; ix++)
|
|
{
|
|
xx = (double)(ix+1)*hhx;
|
|
afp = eps*afun(xx+0.5*hhx,yy,zz)/hhx/hhx;
|
|
afm = eps*afun(xx-0.5*hhx,yy,zz)/hhx/hhx;
|
|
bfp = eps*bfun(xx,yy+0.5*hhy,zz)/hhy/hhy;
|
|
bfm = eps*bfun(xx,yy-0.5*hhy,zz)/hhy/hhy;
|
|
cfp = eps*cfun(xx,yy,zz+0.5*hhz)/hhz/hhz;
|
|
cfm = eps*cfun(xx,yy,zz-0.5*hhz)/hhz/hhz;
|
|
df = dfun(xx,yy,zz)/hhx;
|
|
ef = efun(xx,yy,zz)/hhy;
|
|
ff = ffun(xx,yy,zz)/hhz;
|
|
gf = gfun(xx,yy,zz);
|
|
diag_j[cnt] = row_index;
|
|
diag_data[cnt++] = afp+afm+bfp+bfm+cfp+cfm+gf-df-ef-ff;
|
|
rhs_data[row_index] = rfun(xx,yy,zz);
|
|
if (ix == 0) rhs_data[row_index] += afm*bndfun(0,yy,zz);
|
|
if (iy == 0) rhs_data[row_index] += bfm*bndfun(xx,0,zz);
|
|
if (iz == 0) rhs_data[row_index] += cfm*bndfun(xx,yy,0);
|
|
if (ix+1 == nx) rhs_data[row_index] += (afp-df)*bndfun(1.0,yy,zz);
|
|
if (iy+1 == ny) rhs_data[row_index] += (bfp-ef)*bndfun(xx,1.0,zz);
|
|
if (iz+1 == nz) rhs_data[row_index] += (cfp-ff)*bndfun(xx,yy,1.0);
|
|
if (iz > nz_part[r])
|
|
{
|
|
diag_j[cnt] = row_index-nx_local*ny_local;
|
|
diag_data[cnt++] = -cfm;
|
|
}
|
|
else
|
|
{
|
|
if (iz)
|
|
{
|
|
offd_j[o_cnt] = hypre_map(ix,iy,iz-1,p,q,r-1,P,Q,R,
|
|
nx_part,ny_part,nz_part,global_part);
|
|
offd_data[o_cnt++] = -cfm;
|
|
}
|
|
}
|
|
if (iy > ny_part[q])
|
|
{
|
|
diag_j[cnt] = row_index-nx_local;
|
|
diag_data[cnt++] = -bfm;
|
|
}
|
|
else
|
|
{
|
|
if (iy)
|
|
{
|
|
offd_j[o_cnt] = hypre_map(ix,iy-1,iz,p,q-1,r,P,Q,R,
|
|
nx_part,ny_part,nz_part,global_part);
|
|
offd_data[o_cnt++] = -bfm;
|
|
}
|
|
}
|
|
if (ix > nx_part[p])
|
|
{
|
|
diag_j[cnt] = row_index-1;
|
|
diag_data[cnt++] = -afm;
|
|
}
|
|
else
|
|
{
|
|
if (ix)
|
|
{
|
|
offd_j[o_cnt] = hypre_map(ix-1,iy,iz,p-1,q,r,P,Q,R,
|
|
nx_part,ny_part,nz_part,global_part);
|
|
offd_data[o_cnt++] = -afm;
|
|
}
|
|
}
|
|
if (ix+1 < nx_part[p+1])
|
|
{
|
|
diag_j[cnt] = row_index+1;
|
|
diag_data[cnt++] = -afp+df;
|
|
}
|
|
else
|
|
{
|
|
if (ix+1 < nx)
|
|
{
|
|
offd_j[o_cnt] = hypre_map(ix+1,iy,iz,p+1,q,r,P,Q,R,
|
|
nx_part,ny_part,nz_part,global_part);
|
|
offd_data[o_cnt++] = -afp+df;
|
|
}
|
|
}
|
|
if (iy+1 < ny_part[q+1])
|
|
{
|
|
diag_j[cnt] = row_index+nx_local;
|
|
diag_data[cnt++] = -bfp +ef;
|
|
}
|
|
else
|
|
{
|
|
if (iy+1 < ny)
|
|
{
|
|
offd_j[o_cnt] = hypre_map(ix,iy+1,iz,p,q+1,r,P,Q,R,
|
|
nx_part,ny_part,nz_part,global_part);
|
|
offd_data[o_cnt++] = -bfp+ef;
|
|
}
|
|
}
|
|
if (iz+1 < nz_part[r+1])
|
|
{
|
|
diag_j[cnt] = row_index+nx_local*ny_local;
|
|
diag_data[cnt++] = -cfp+ff;
|
|
}
|
|
else
|
|
{
|
|
if (iz+1 < nz)
|
|
{
|
|
offd_j[o_cnt] = hypre_map(ix,iy,iz+1,p,q,r+1,P,Q,R,
|
|
nx_part,ny_part,nz_part,global_part);
|
|
offd_data[o_cnt++] = -cfp+ff;
|
|
}
|
|
}
|
|
row_index++;
|
|
}
|
|
}
|
|
}
|
|
|
|
if (num_procs > 1)
|
|
{
|
|
for (i=0; i < num_cols_offd; i++)
|
|
col_map_offd[i] = offd_j[i];
|
|
|
|
qsort0(col_map_offd, 0, num_cols_offd-1);
|
|
|
|
for (i=0; i < num_cols_offd; i++)
|
|
for (j=0; j < num_cols_offd; j++)
|
|
if (offd_j[i] == col_map_offd[j])
|
|
{
|
|
offd_j[i] = j;
|
|
break;
|
|
}
|
|
}
|
|
|
|
par_rhs = hypre_ParVectorCreate(comm, grid_size, global_part);
|
|
rhs = hypre_ParVectorLocalVector(par_rhs);
|
|
hypre_VectorData(rhs) = rhs_data;
|
|
|
|
A = hypre_ParCSRMatrixCreate(comm, grid_size, grid_size,
|
|
global_part, global_part, num_cols_offd,
|
|
diag_i[local_num_rows],
|
|
offd_i[local_num_rows]);
|
|
|
|
hypre_ParCSRMatrixColMapOffd(A) = col_map_offd;
|
|
|
|
diag = hypre_ParCSRMatrixDiag(A);
|
|
hypre_CSRMatrixI(diag) = diag_i;
|
|
hypre_CSRMatrixJ(diag) = diag_j;
|
|
hypre_CSRMatrixData(diag) = diag_data;
|
|
|
|
offd = hypre_ParCSRMatrixOffd(A);
|
|
hypre_CSRMatrixI(offd) = offd_i;
|
|
if (num_cols_offd)
|
|
{
|
|
hypre_CSRMatrixJ(offd) = offd_j;
|
|
hypre_CSRMatrixData(offd) = offd_data;
|
|
}
|
|
|
|
hypre_TFree(nx_part);
|
|
hypre_TFree(ny_part);
|
|
hypre_TFree(nz_part);
|
|
|
|
*rhs_ptr = (HYPRE_ParVector) par_rhs;
|
|
|
|
return (HYPRE_ParCSRMatrix) A;
|
|
}
|
|
|
|
/*--------------------------------------------------------------------------
 * afun
 *
 * Piecewise-constant coefficient used for the x-direction stencil weights
 * in GenerateVarDifConv.  Each coordinate is classified against the
 * thresholds 0.1 and 0.9:
 *   - all three coordinates strictly outside [0.1, 0.9]  -> 0.01
 *   - all three coordinates inside [0.1, 0.9]            -> 1000.0
 *   - anything else                                      -> 1.0
 *--------------------------------------------------------------------------*/
double afun(double xx, double yy, double zz)
{
   /* "outer": strictly below 0.1 or strictly above 0.9 */
   int x_outer = (xx < 0.1 || xx > 0.9);
   int y_outer = (yy < 0.1 || yy > 0.9);
   int z_outer = (zz < 0.1 || zz > 0.9);

   /* "inner": within the closed interval [0.1, 0.9] */
   int x_inner = (xx >= 0.1 && xx <= 0.9);
   int y_inner = (yy >= 0.1 && yy <= 0.9);
   int z_inner = (zz >= 0.1 && zz <= 0.9);

   if (x_outer && y_outer && z_outer)
   {
      return 0.01;
   }
   if (x_inner && y_inner && z_inner)
   {
      return 1000.0;
   }
   return 1.0;
}
|
|
|
|
/*--------------------------------------------------------------------------
 * bfun
 *
 * Piecewise-constant coefficient used for the y-direction stencil weights
 * in GenerateVarDifConv.  Each coordinate is classified against the
 * thresholds 0.1 and 0.9:
 *   - all three coordinates strictly outside [0.1, 0.9]  -> 0.01
 *   - all three coordinates inside [0.1, 0.9]            -> 1000.0
 *   - anything else                                      -> 1.0
 *--------------------------------------------------------------------------*/
double bfun(double xx, double yy, double zz)
{
   /* "outer": strictly below 0.1 or strictly above 0.9 */
   int x_outer = (xx < 0.1 || xx > 0.9);
   int y_outer = (yy < 0.1 || yy > 0.9);
   int z_outer = (zz < 0.1 || zz > 0.9);

   /* "inner": within the closed interval [0.1, 0.9] */
   int x_inner = (xx >= 0.1 && xx <= 0.9);
   int y_inner = (yy >= 0.1 && yy <= 0.9);
   int z_inner = (zz >= 0.1 && zz <= 0.9);

   if (x_outer && y_outer && z_outer)
   {
      return 0.01;
   }
   if (x_inner && y_inner && z_inner)
   {
      return 1000.0;
   }
   return 1.0;
}
|
|
|
|
/*--------------------------------------------------------------------------
 * cfun
 *
 * Piecewise-constant coefficient used for the z-direction stencil weights
 * in GenerateVarDifConv.  Each coordinate is classified against the
 * thresholds 0.1 and 0.9:
 *   - all three coordinates strictly outside [0.1, 0.9]  -> 0.01
 *   - all three coordinates inside [0.1, 0.9]            -> 1000.0
 *   - anything else                                      -> 1.0
 *--------------------------------------------------------------------------*/
double cfun(double xx, double yy, double zz)
{
   /* "outer": strictly below 0.1 or strictly above 0.9 */
   int x_outer = (xx < 0.1 || xx > 0.9);
   int y_outer = (yy < 0.1 || yy > 0.9);
   int z_outer = (zz < 0.1 || zz > 0.9);

   /* "inner": within the closed interval [0.1, 0.9] */
   int x_inner = (xx >= 0.1 && xx <= 0.9);
   int y_inner = (yy >= 0.1 && yy <= 0.9);
   int z_inner = (zz >= 0.1 && zz <= 0.9);

   if (x_outer && y_outer && z_outer)
   {
      return 0.01;
   }
   if (x_inner && y_inner && z_inner)
   {
      return 1000.0;
   }
   return 1.0;
}
|
|
|
|
/*--------------------------------------------------------------------------
 * dfun
 *
 * First-order coefficient for the x direction (GenerateVarDifConv divides
 * it by the x mesh width).  Currently identically zero; the arguments are
 * accepted but not used.
 *--------------------------------------------------------------------------*/
double dfun(double xx, double yy, double zz)
{
   (void) xx;
   (void) yy;
   (void) zz;

   return 0.0;
}
|
|
|
|
/*--------------------------------------------------------------------------
 * efun
 *
 * First-order coefficient for the y direction (GenerateVarDifConv divides
 * it by the y mesh width).  Currently identically zero; the arguments are
 * accepted but not used.
 *--------------------------------------------------------------------------*/
double efun(double xx, double yy, double zz)
{
   (void) xx;
   (void) yy;
   (void) zz;

   return 0.0;
}
|
|
|
|
/*--------------------------------------------------------------------------
 * ffun
 *
 * First-order coefficient for the z direction (GenerateVarDifConv divides
 * it by the z mesh width).  Identically zero; the arguments are accepted
 * but not used.
 *--------------------------------------------------------------------------*/
double ffun(double xx, double yy, double zz)
{
   (void) xx;
   (void) yy;
   (void) zz;

   return 0.0;
}
|
|
|
|
/*--------------------------------------------------------------------------
 * gfun
 *
 * Zeroth-order coefficient that GenerateVarDifConv adds to the diagonal
 * stencil entry.  Identically zero; the arguments are accepted but not
 * used.
 *--------------------------------------------------------------------------*/
double gfun(double xx, double yy, double zz)
{
   (void) xx;
   (void) yy;
   (void) zz;

   return 0.0;
}
|
|
|
|
/*--------------------------------------------------------------------------
 * rfun
 *
 * Right-hand-side function sampled at each grid point by
 * GenerateVarDifConv.  Constant 1.0 everywhere; the arguments are accepted
 * but not used.
 *--------------------------------------------------------------------------*/
double rfun(double xx, double yy, double zz)
{
   (void) xx;
   (void) yy;
   (void) zz;

   return 1.0;
}
|
|
|
|
/*--------------------------------------------------------------------------
 * bndfun
 *
 * Boundary value function; GenerateVarDifConv evaluates it on the faces
 * of the unit cube and folds the result into the right-hand side.
 * Currently identically zero; the arguments are accepted but not used.
 *--------------------------------------------------------------------------*/
double bndfun(double xx, double yy, double zz)
{
   (void) xx;
   (void) yy;
   (void) zz;

   return 0.0;
}
|