nek/bps/bps.usr

C Copyright (c) 2017, Lawrence Livermore National Security, LLC. Produced at
C the Lawrence Livermore National Laboratory. LLNL-CODE-734707. All Rights
C reserved. See files LICENSE and NOTICE for details.
C
C This file is part of CEED, a collection of benchmarks, miniapps, software
C libraries and APIs for efficient high-order finite element and spectral
C element discretizations for exascale applications. For more information and
C source code availability see http://github.com/ceed.
C
C The CEED research is supported by the Exascale Computing Project (17-SC-20-SC)
C a collaborative effort of two U.S. Department of Energy organizations (Office
C of Science and the National Nuclear Security Administration) responsible for
C the planning and preparation of a capable exascale ecosystem, including
C software, applications, hardware, advanced system engineering and early
C testbed platforms, in support of the nation's exascale computing imperative.

C> @file
C> Mass and diffusion operators examples using Nek5000
C_TESTARGS(name="BP1") -c {ceed_resource} -e bp1 -n 1 -b 4 -test
C_TESTARGS(name="BP3") -c {ceed_resource} -e bp3 -n 1 -b 4 -test
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set up the mass operator at q quadrature points.
C
C     Builds the 3x3 matrix a from u2, takes its determinant and
C     scales it by u3.
C
C     Input:
C       ctx  - context array (not referenced here)
C       q    - number of quadrature points
C       u1   - three components per point, u1(i+q*d), d=0..2
C              (presumably the physical coordinates - confirm)
C       u2   - nine components per point; u2(i+q*(r+3*c)) holds
C              a(r+1,c+1) for r,c=0..2
C       u3   - one value per point (presumably the quadrature
C              weight - confirm)
C     Output:
C       v1   - rho: u3*det(a)
C       v2   - RHS: u3*det(a)*sqrt(u1x**2+u1y**2+u1z**2)
C       ierr - always set to 0
C     u4..u16 and v3..v16 are accepted but never referenced.
      subroutine masssetupf(ctx,q,u1,u2,u3,u4,u5,u6,u7,
     $  u8,u9,u10,u11,u12,u13,u14,u15,u16,v1,v2,v3,v4,v5,v6,v7,v8,
     $  v9,v10,v11,v12,v13,v14,v15,v16,ierr)
      integer q,ierr
      real*8 ctx(1)
      real*8 u1(3*q),u2(9*q),u3(q)
      real*8 v1(q),v2(q)
      integer i
      real*8 a11,a12,a13,a21,a22,a23,a31,a32,a33
      real*8 g11,g12,g13
      real*8 jacmq

C     Quadrature Point Loop
      do i=1,q
        a11=u2(i+q*0)
        a21=u2(i+q*1)
        a31=u2(i+q*2)

        a12=u2(i+q*3)
        a22=u2(i+q*4)
        a32=u2(i+q*5)

        a13=u2(i+q*6)
        a23=u2(i+q*7)
        a33=u2(i+q*8)

C       Cofactors of the first column of a. The determinant needs
C       only these three, so the other six are not formed.
        g11 = (a22*a33-a23*a32)
        g12 = (a13*a32-a33*a12)
        g13 = (a12*a23-a22*a13)

        jacmq = a11*g11+a21*g12+a31*g13

C       Rho
        v1(i)=u3(i)*jacmq

C       RHS
        v2(i)=u3(i)*jacmq
     $             *dsqrt(u1(i+q*0)*u1(i+q*0)
     $                   +u1(i+q*1)*u1(i+q*1)
     $                   +u1(i+q*2)*u1(i+q*2))
      enddo

      ierr=0
      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Apply the mass operator: pointwise product of u2 and u1.
C
C     Input:
C       ctx  - context array (not referenced here)
C       q    - number of quadrature points
C       u1   - one value per point
C       u2   - one value per point
C     Output:
C       v1   - v1(i) = u2(i)*u1(i)
C       ierr - always set to 0
C     u3..u16 and v2..v16 are accepted but never referenced.
      subroutine massf(ctx,q,u1,u2,u3,u4,u5,u6,u7,
     $  u8,u9,u10,u11,u12,u13,u14,u15,u16,v1,v2,v3,v4,v5,v6,v7,v8,
     $  v9,v10,v11,v12,v13,v14,v15,v16,ierr)
      integer q,ierr
      real*8 ctx(1)
      real*8 u1(q),u2(q),v1(q)
      integer iq

C     Quadrature Point Loop
      do iq=1,q
        v1(iq)=u2(iq)*u1(iq)
      enddo

      ierr=0
      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set up the diffusion operator at q quadrature points.
C
C     Builds the 3x3 matrix a from u2, forms its nine cofactors and
C     determinant, and stores the six independent entries of the
C     symmetric geometric-factor matrix plus a right-hand side.
C
C     Input:
C       ctx  - context array (not referenced here)
C       q    - number of quadrature points
C       u1   - three components per point, u1(i+q*d), d=0..2
C              (presumably the physical coordinates - confirm)
C       u2   - nine components per point; u2(i+q*(r+3*c)) holds
C              a(r+1,c+1) for r,c=0..2
C       u3   - one value per point (presumably the quadrature
C              weight - confirm)
C     Output:
C       v1   - six values per point, v1(i+m*q), m=0..5, in the
C              Voigt order Grr,Gss,Gtt,Gst,Grt,Grs, each scaled by
C              u3/det(a)
C       v2   - RHS: u3*det(a)*pi**2*(k1**2+k2**2+k3**2)
C              *sin(pi*(c1+k1*x))*sin(pi*(c2+k2*y))
C              *sin(pi*(c3+k3*z)) with (x,y,z) taken from u1
C       ierr - always set to 0
C     u4..u16 and v3..v16 are accepted but never referenced.
      subroutine diffsetupf(ctx,q,u1,u2,u3,u4,u5,u6,u7,
     $  u8,u9,u10,u11,u12,u13,u14,u15,u16,v1,v2,v3,v4,v5,v6,v7,v8,
     $  v9,v10,v11,v12,v13,v14,v15,v16,ierr)
      integer q,ierr
      real*8 ctx(1)
      real*8 u1(3*q)
      real*8 u2(9*q)
      real*8 u3(q)
      real*8 v1(6*q)
      real*8 v2(q)
      integer i
      real*8 a11,a12,a13,a21,a22,a23,a31,a32,a33
      real*8 g11,g12,g13,g21,g22,g23,g31,g32,g33
      real*8 jacmq,scl
      real*8 c(3),k(3)
C     pi is held as an explicit real*8 constant so its precision
C     does not depend on implicit typing or on compiler flags that
C     promote default reals.
      real*8 pi
      parameter (pi=3.14159265358979323846d0)

C     Phase shifts c and wave numbers k of the sine product; they
C     are the same for every point, so they are set once here.
      c(1)=0.d0
      c(2)=1.d0
      c(3)=2.d0
      k(1)=1.d0
      k(2)=2.d0
      k(3)=3.d0

C     Quadrature Point Loop
      do i=1,q
        a11=u2(i+q*0)
        a12=u2(i+q*3)
        a13=u2(i+q*6)

        a21=u2(i+q*1)
        a22=u2(i+q*4)
        a23=u2(i+q*7)

        a31=u2(i+q*2)
        a32=u2(i+q*5)
        a33=u2(i+q*8)

        g11 = (a22*a33-a23*a32)
        g12 = (a13*a32-a33*a12)
        g13 = (a12*a23-a22*a13)

        g21 = (a23*a31-a21*a33)
        g22 = (a11*a33-a31*a13)
        g23 = (a13*a21-a23*a11)

        g31 = (a21*a32-a22*a31)
        g32 = (a12*a31-a32*a11)
        g33 = (a11*a22-a21*a12)

        jacmq = a11*g11+a21*g12+a31*g13

        scl = u3(i)/jacmq

C       Geometric factors
C       Stored in Voigt convention
C       0 5 4
C       5 1 3
C       4 3 2
        v1(i+0*q) = scl*(g11*g11+g12*g12+g13*g13) ! Grr
        v1(i+1*q) = scl*(g21*g21+g22*g22+g23*g23) ! Gss
        v1(i+2*q) = scl*(g31*g31+g32*g32+g33*g33) ! Gtt
        v1(i+3*q) = scl*(g21*g31+g22*g32+g23*g33) ! Gst
        v1(i+4*q) = scl*(g11*g31+g12*g32+g13*g33) ! Grt
        v1(i+5*q) = scl*(g11*g21+g12*g22+g13*g23) ! Grs

C       RHS
        v2(i) = u3(i)*jacmq*pi*pi
     $            *dsin(pi*(c(1)+k(1)*u1(i+0*q)))
     $            *dsin(pi*(c(2)+k(2)*u1(i+1*q)))
     $            *dsin(pi*(c(3)+k(3)*u1(i+2*q)))
     $            *(k(1)*k(1)+k(2)*k(2)+k(3)*k(3))

      enddo

      ierr=0
      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Apply the diffusion operator: multiply the three-component
C     vector in u1 by the symmetric 3x3 matrix stored in u2.
C
C     Input:
C       ctx  - context array (not referenced here)
C       q    - number of quadrature points
C       u1   - three components per point, u1(i+d*q), d=0..2
C       u2   - six components per point, u2(i+m*q), m=0..5, placed
C              in the symmetric matrix as
C                0 5 4
C                5 1 3
C                4 3 2
C     Output:
C       v1   - three components per point, v1(i+d*q), d=0..2
C       ierr - always set to 0
C     u3..u16 and v2..v16 are accepted but never referenced.
      subroutine diffusionf(ctx,q,u1,u2,u3,u4,u5,u6,u7,
     $  u8,u9,u10,u11,u12,u13,u14,u15,u16,v1,v2,v3,v4,v5,v6,v7,v8,
     $  v9,v10,v11,v12,v13,v14,v15,v16,ierr)
      integer q,ierr
      real*8 ctx(1)
      real*8 u1(3*q),u2(6*q),v1(3*q)
      integer i
      real*8 w1,w2,w3

C     Quadrature Point Loop
      do i=1,q
C       The three input components at this point
        w1 = u1(i)
        w2 = u1(i+q)
        w3 = u1(i+2*q)

        v1(i+0*q) = u2(i+0*q)*w1+u2(i+5*q)*w2+u2(i+4*q)*w3
        v1(i+1*q) = u2(i+5*q)*w1+u2(i+1*q)*w2+u2(i+3*q)*w3
        v1(i+2*q) = u2(i+4*q)*w1+u2(i+3*q)*w2+u2(i+2*q)*w3
      enddo

      ierr=0
      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set h2 as rhoJac: h2 = q*bmq with the constant factor q = 1.
C
C     Input:
C       bmq - source values; lelt*nxq**ldim entries are read
C       nxq - number of points (per direction, given nxq**ldim)
C     Output:
C       h2  - q*bmq over the same lelt*nxq**ldim entries
C     Side effect: zwgl(zd,wd,nxq) is called on the arrays held in
C     common /ctmp77/; its results are not used in this routine.
      subroutine set_h2_as_rhoJac_GL(h2,bmq,nxq)
      include 'SIZE'
      real*8 h2(1),bmq(1)

      common /ctmp77/ wd(lxd),zd(lxd)
      integer i,L

C     nxq = number of points
      call zwgl(zd,wd,nxq)

C     Later, this can be a function of position...
      q = 1.0

C     i = entries per element; one sweep covers all lelt elements
      i = nxq**ldim
      do L=1,lelt*i
         h2(L) = q*bmq(L)
      enddo

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set distance initial condition for BP1.
C
C     Fills e(i) = sqrt(x*x+y*y+z*z) for the lx1*ly1*lz1*nelt
C     points of xm1, ym1, zm1 and then passes e through dsavg.
C
C     Input:  (none; the coordinates come from the included
C             xm1, ym1, zm1)
C     Output: e
      subroutine dist_fld_h1(e)
      include 'SIZE'
      include 'TOTAL'
      real*8 e(1)
      real*8 x,y,z

      n=lx1*ly1*lz1*nelt

      do i=1,n
C       Copy into real*8 locals so that dsqrt sees a real*8 value
        x=xm1(i,1,1,1)
        y=ym1(i,1,1,1)
        z=zm1(i,1,1,1)
        e(i) = dsqrt(x*x+y*y+z*z)
      enddo

C     This is requisite for random fields
      call dsavg(e)

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set sine initial condition for BP3.
C
C     Fills e(i) = sin(pi*(c1+k1*x))*sin(pi*(c2+k2*y))
C                 *sin(pi*(c3+k3*z)) with c=(0,1,2), k=(1,2,3)
C     for the lx1*ly1*lz1*nelt points of xm1, ym1, zm1 and then
C     passes e through dsavg.
C
C     Input:  (none; the coordinates come from the included
C             xm1, ym1, zm1)
C     Output: e
      subroutine sin_fld_h1(e)
      include 'SIZE'
      include 'TOTAL'
      real*8 e(1)
      real*8 x,y,z
      real*8 c(3),k(3)

      n=lx1*ly1*lz1*nelt
      pi = 3.14159265358979323846

C     Phase shifts
      c(1)=0.
      c(2)=1.
      c(3)=2.
C     Wave numbers
      k(1)=1.
      k(2)=2.
      k(3)=3.

      do i=1,n
        x=xm1(i,1,1,1)
        y=ym1(i,1,1,1)
        z=zm1(i,1,1,1)

        e(i) = dsin(pi*(c(1)+k(1)*x))
     $        *dsin(pi*(c(2)+k(2)*y))
     $        *dsin(pi*(c(3)+k(3)*z))
      enddo

C     This is requisite for random fields
      call dsavg(e)

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set variable properties: udiff and utrans are both set to
C     zero for every point. The arguments ix,iy,iz,eg are not
C     referenced (the lookup e = gllel(eg) is left disabled).
      subroutine uservp(ix,iy,iz,eg)
      include 'SIZE'
      include 'TOTAL'
      include 'NEKUSE'
      integer e,f,eg

      utrans = 0.0
      udiff  = 0.0

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set acceleration term: ffx, ffy and ffz are all set to zero.
C
C     Note: this is an acceleration term, NOT a force!
C     Thus, ffx will subsequently be multiplied by rho(x,t).
C
C     The arguments ix,iy,iz,eg are not referenced (the lookup
C     e = gllel(eg) is left disabled).
      subroutine userf(ix,iy,iz,eg)
      include 'SIZE'
      include 'TOTAL'
      include 'NEKUSE'
      integer e,f,eg

      ffz = 0.0
      ffy = 0.0
      ffx = 0.0

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set source term: qvol is set to zero. The local element
C     number e is looked up from gllel(eg) but not used further.
      subroutine userq(i,j,k,eg)
      include 'SIZE'
      include 'TOTAL'
      include 'NEKUSE'
      integer e,f,eg

      e    = gllel(eg)
      qvol = 0

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set up boundary conditions: ux, uy, uz and temp are all set
C     to zero. The arguments ix,iy,iz,f,eg are not referenced.
C     NOTE ::: This subroutine MAY NOT be called by every process
      subroutine userbc(ix,iy,iz,f,eg)
      include 'SIZE'
      include 'TOTAL'
      include 'NEKUSE'
      integer e,f,eg

      temp = 0.0
      uz   = 0.0
      uy   = 0.0
      ux   = 0.0

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Set up initial conditions: ux, uy, uz and temp are all set
C     to zero. The arguments ix,iy,iz,eg are not referenced.
      subroutine useric(ix,iy,iz,eg)
      include 'SIZE'
      include 'TOTAL'
      include 'NEKUSE'
      integer e,f,eg

      temp = 0.0
      uz   = 0.0
      uy   = 0.0
      ux   = 0.0

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     This routine to modify element vertices.
C     Intentionally empty here: nothing is changed.
      subroutine usrdat
      include 'SIZE'
      include 'TOTAL'

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     This routine to modify mesh coordinates.
C
C     Passes xm1, ym1 and zm1 in turn to rescale_x with the bounds
C     x0 = 0 and x1 = 1, then sets param(59) to 1.
      subroutine usrdat2
      include 'SIZE'
      include 'TOTAL'

C     Target bounds handed to rescale_x for every direction
      x0 = 0
      x1 = 1

      call rescale_x(xm1,x0,x1)
      call rescale_x(ym1,x0,x1)
      call rescale_x(zm1,x0,x1)

C     Force Nek to use the "deformed element" formulation
      param(59)=1

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     User hook usrdat3. Intentionally empty here.
      subroutine usrdat3
      include 'SIZE'
      include 'TOTAL'

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Apply zero Dirichlet boundary conditions by multiplying r1
C     pointwise with h2 over nx1*ny1*nz1*nel entries.
C     (h2 presumably holds a 0/1 mask - confirm against caller.)
C
C     Input:  h2  - multiplier
C             nel - number of elements
C     In/out: r1  - overwritten with r1*h2
      subroutine xmask1   (r1,h2,nel)
      include 'SIZE'
      include 'TOTAL'
      real*8 r1(1),h2(1)

      n=nx1*ny1*nz1*nel

      do i=1,n
         r1(i)=r1(i)*h2(i)
      enddo

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Compute the Linfty norm of (x-y), relative to the largest
C     entry of x and y, reduced with glmax.
C
C     Input:
C       x,y - arrays of length n
C       n   - number of entries
C     Result:
C       glrdif =  max|x-y| / max(x,y)   when max(x,y) > 0
C              = -max|x-y|              otherwise
C     NOTE(review): the normaliser is built from the signed values
C     of x and y (floored at 0), not from their magnitudes -
C     confirm that this is intended.
      function glrdif(x,y,n)
      real*8 x(n),y(n)

      dmx=0
      xmx=0
      ymx=0

      do i=1,n
         diff=abs(x(i)-y(i))
         dmx =max(dmx,diff)
         xmx =max(xmx,x(i))
         ymx =max(ymx,y(i))
      enddo

      xmx = max(xmx,ymx)

C     max across processors
      dmx = glmax(dmx,1)
      xmx = glmax(xmx,1)

C     Negative indicates something strange
      glrdif = -dmx
      if (xmx.gt.0) glrdif = dmx/xmx

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     3D local gradient of u on an (N+1)**3 tensor-product block.
C
C     Input:
C       u    - field, u(0:N,0:N,0:N)
C       N    - upper index bound in each direction
C       D,Dt - (N+1)x(N+1) matrices (presumably the derivative
C              matrix and its transpose - confirm against caller)
C     Output:
C       ur,us,ut - the three results, same shape as u
C
C     Assumes mxm(a,n1,b,n2,c,n3) forms c(n1,n3) = a(n1,n2)*b(n2,n3)
C     - TODO confirm. Under that reading: ur applies D along the
C     first index, us applies Dt along the second index slab by
C     slab, and ut applies Dt along the third index.
      subroutine loc_grad3(ur,us,ut,u,N,D,Dt)
      real*8 ur(0:N,0:N,0:N),us(0:N,0:N,0:N),ut(0:N,0:N,0:N)
      real*8 u (0:N,0:N,0:N)
      real*8 D (0:N,0:N),Dt(0:N,0:N)

C     Points per direction and per slab
      np  = N+1
      np2 = np*np

      call mxm(D ,np,u(0,0,0),np,ur,np2)

      do iz=0,N
         call mxm(u(0,0,iz),np,Dt,np,us(0,0,iz),np)
      enddo

      call mxm(u(0,0,0),np2,Dt,np,ut,np)

      end
86a4271fSThilina Rathnayakec-----------------------------------------------------------------------
C     3D transpose of local gradient: accumulates the three
C     directional contributions ur, us, ut into u.
C
C     Input:
C       ur,us,ut - fields, each (0:N,0:N,0:N)
C       N        - upper index bound in each direction
C       D,Dt     - (N+1)x(N+1) matrices (presumably the derivative
C                  matrix and its transpose - confirm)
C       w        - work array of the same shape as u; overwritten
C     Output:
C       u        - sum of the three mxm products
C
C     Assumes mxm(a,n1,b,n2,c,n3) forms c(n1,n3) = a(n1,n2)*b(n2,n3)
C     and add2(a,b,n) adds b into a over n entries - TODO confirm.
      subroutine loc_grad3t(u,ur,us,ut,N,D,Dt,w)
      real*8 u (0:N,0:N,0:N)
      real*8 ur(0:N,0:N,0:N),us(0:N,0:N,0:N),ut(0:N,0:N,0:N)
      real*8 D (0:N,0:N),Dt(0:N,0:N)
      real*8 w (0:N,0:N,0:N)

C     Points per direction, per slab and per block
      np  = N+1
      np2 = np*np
      np3 = np*np*np

C     First-index contribution goes straight into u
      call mxm(Dt,np,ur,np,u(0,0,0),np2)

C     Second-index contribution, slab by slab, via w
      do iz=0,N
         call mxm(us(0,0,iz),np,D ,np,w(0,0,iz),np)
      enddo
      call add2(u(0,0,0),w,np3)

C     Third-index contribution via w
      call mxm(ut,np2,D ,np,w,np)
      call add2(u(0,0,0),w,np3)

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Routine to generate elemental geometric matrices on the
C     quadrature mesh.
C
C     Input:
C       nxq  - number of quadrature points per direction; the
C              routine aborts through exitti when nxq > lzq
C     Output:
C       gf   - six scaled geometric factors per point and element,
C              in the order Grr,Grs,Grt,Gss,Gst,Gtt
C       bmq  - w3mq*det(a) per point and element
C       w3mq - tensor product wd(i)*wd(j)*wd(k) of the weights
C     Work storage lives in common /ctmp1/, /sxrns/, /ctmp77/ and
C     /dxmfine/.
C     NOTE(review): zwgl, gen_dgl and intp_rstd are all driven with
C     lzq points while the loops run over nxq points, so the two
C     are presumably expected to be equal - confirm.
      subroutine geodatq(gf,bmq,w3mq,nxq)
      include 'SIZE'
      include 'TOTAL'

      parameter (lg=3+3*(ldim-2),lzq=lx1+1,lxyd=lzq**ldim)

      real*8 gf(lg,nxq**ldim,lelt)
      real*8 bmq(nxq**ldim,lelt)
      real*8 w3mq(nxq,nxq,nxq)

      common /ctmp1/ xr(lxyd),xs(lxyd),xt(lxyd)
      common /sxrns/ yr(lxyd),ys(lxyd),yt(lxyd)
     $ ,             zr(lxyd),zs(lxyd),zt(lxyd)

      common /ctmp77/ wd(lxd),zd(lxd)
      common /dxmfine/ dxmq(lzq,lzq),dxtmq(lzq,lzq)

      integer e
      real*8 tmp(lxyd)
      real*8 a11,a12,a13,a21,a22,a23,a31,a32,a33
      real*8 g11,g12,g13,g21,g22,g23,g31,g32,g33
      real*8 jacmq

      if (nxq.gt.lzq) call exitti('ABORT: recompile with lzq=$',nxq)

C     Points zd and weights wd, then the matrices dxmq and dxtmq
      call zwgl    (zd,wd,lzq)
      call gen_dgl (dxmq,dxtmq,lzq,lzq,tmp)

C     Tensor-product weights
      do k=1,nxq
      do j=1,nxq
      do i=1,nxq
         w3mq(i,j,k) = wd(i)*wd(j)*wd(k)
      enddo
      enddo
      enddo

      nxyzq = nxq**ldim
      nxqm1 = lzq-1

      do e=1,nelt
C        Interpolate each coordinate (0-->Fwd interpolation) and
C        take its local gradient.
         call intp_rstd (tmp,xm1(1,1,1,e),lx1,lzq,if3d,0)
         call loc_grad3 (xr,xs,xt,tmp,nxqm1,dxmq,dxtmq)

         call intp_rstd (tmp,ym1(1,1,1,e),lx1,lzq,if3d,0)
         call loc_grad3 (yr,ys,yt,tmp,nxqm1,dxmq,dxtmq)

         call intp_rstd (tmp,zm1(1,1,1,e),lx1,lzq,if3d,0)
         call loc_grad3 (zr,zs,zt,tmp,nxqm1,dxmq,dxtmq)

         do i=1,nxyzq
C           Matrix a of coordinate derivatives at this point
            a11 = xr(i)
            a12 = xs(i)
            a13 = xt(i)

            a21 = yr(i)
            a22 = ys(i)
            a23 = yt(i)

            a31 = zr(i)
            a32 = zs(i)
            a33 = zt(i)

C           Cofactors of a
            g11 = (a22*a33-a23*a32)
            g12 = (a13*a32-a33*a12)
            g13 = (a12*a23-a22*a13)

            g21 = (a23*a31-a21*a33)
            g22 = (a11*a33-a31*a13)
            g23 = (a13*a21-a23*a11)

            g31 = (a21*a32-a22*a31)
            g32 = (a12*a31-a32*a11)
            g33 = (a11*a22-a21*a12)

            jacmq = a11*g11+a21*g12+a31*g13

C           w3mq is addressed linearly through its first index
            bmq(i,e)  = w3mq(i,1,1)*jacmq
            scale     = w3mq(i,1,1)/jacmq

            gf(1,i,e) = scale*(g11*g11+g12*g12+g13*g13) ! Grr
            gf(2,i,e) = scale*(g11*g21+g12*g22+g13*g23) ! Grs
            gf(3,i,e) = scale*(g11*g31+g12*g32+g13*g33) ! Grt
            gf(4,i,e) = scale*(g21*g21+g22*g22+g23*g23) ! Gss
            gf(5,i,e) = scale*(g21*g31+g22*g32+g23*g33) ! Gst
            gf(6,i,e) = scale*(g31*g31+g32*g32+g33*g33) ! Gtt

         enddo
      enddo

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Build the diagonal preconditioner used for the BP1 solve.
C
C     The mass matrix diagonal bm1 is copied into d, passed through
C     dssum, and then through invcol1 (Nek5000 helpers; presumably
C     direct-stiffness summation followed by an in-place reciprocal,
C     i.e. d = 1/dssum(bm1) -- confirm against the Nek5000 sources).
C
C     Arguments
C       d   (out) preconditioner, one entry per local grid point
C       h1  (in)  not referenced; kept so the interface is unchanged
C       h2  (in)  not referenced; kept so the interface is unchanged
C
C     The Helmholtz-diagonal code that used to follow the first
C     return statement could never execute and has been removed,
C     together with the declarations that only it used.
      subroutine setprecn_bp1 (d,h1,h2)
      include 'SIZE'
      include 'TOTAL'

      parameter (lxyz=lx1*ly1*lz1)

      real*8    d(lx1,ly1,lz1,lelt),h1(lxyz,lelt),h2(lxyz,lelt)

C     Number of local grid points for the field selected by ifield
      nel   = nelfld(ifield)
      n     = nel*lx1*ly1*lz1

      call copy    (d,bm1,n)   ! Mass matrix preconditioning
      call dssum   (d,nx1,ny1,nz1)
      call invcol1 (d,n)

      return
      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Dummy diagonal preconditioner for the BP3 solve.
C
C     Arguments
C       d   (out) handed to rone together with its full length
C                 (presumably filled with ones -- rone is a Nek5000
C                 helper not shown here)
C       h1  (in)  not referenced
C       h2  (in)  not referenced
      subroutine setprecn_bp3 (d,h1,h2)
      include 'SIZE'
      include 'TOTAL'

C     Length of one local field, padded to the maximum element count
      parameter (lt=lx1*ly1*lz1*lelt)

      real*8 d(lt)
      real*8 h1(lt),h2(lt)

      call rone (d,lt)

      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
C     Dispatch to the benchmark problem selected through get_bp.
C
C     bp = 1 runs bp1 and bp = 3 runs bp3, in both cases only once
C     istep is positive.  Any other value prints a diagnostic on
C     unit 6 (on every call, regardless of istep).
      subroutine userchk
      include 'SIZE'
      include 'TOTAL'

      integer bp

      call get_bp(bp)

      select case (bp)
      case (1)
         if (istep.gt.0) call bp1
      case (3)
         if (istep.gt.0) call bp3
      case default
         write(6,*) "INVALID BP SPECIFICED"
      end select

      return
      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
86a4271fSThilina Rathnayake      subroutine bp1
86a4271fSThilina RathnayakeC     Solution to BP1 using libCEED
C
C     Takes no arguments; works on the Nek5000 common-block data
C     brought in by the includes below.  Steps, in order:
C       1. pack xm1/ym1/zm1 into the element-blocked array coords
C       2. create the libCEED context, bases, element restrictions,
C          vectors, QFunctions (masssetupf, massf) and operators
C       3. apply op_setup, which fills vec_qdata and the RHS r1
C       4. build two further right-hand sides from the saved
C          solution h1: r2 via the libCEED operator op_mass and
C          r3 via the Nek5000 routine axhm1
C       5. call cggos once per right-hand side and print the error
C          against e1 plus timing figures
C       6. destroy every libCEED handle created here
86a4271fSThilina Rathnayake      include 'SIZE'
86a4271fSThilina Rathnayake      include 'TOTAL'
86a4271fSThilina Rathnayake      include 'CTIMER'  ! ifsync
86a4271fSThilina Rathnayake      include 'FDMH1'
*ec3da8bcSJed Brown      include 'ceed/fortran.h'
86a4271fSThilina Rathnayake
C     lzq, lq : points per direction / per element on the lx1+1 grid
C     lx      : grid points per element
C     lg      : number of gf entries stored per point
86a4271fSThilina Rathnayake      parameter (lzq=lx1+1)
86a4271fSThilina Rathnayake      parameter (lx=lx1*ly1*lz1,lg=3+3*(ldim-2),lq=lzq**ldim)
86a4271fSThilina Rathnayake      common /bpgfactors/ gf(lg*lq,lelt),bmq(lq,lelt),w3mq(lq)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      parameter (lt=lx1*ly1*lz1*lelt)
86a4271fSThilina Rathnayake      parameter (ld=lxd*lyd*lzd*lelt)
C     u1: CG solution, r1/r2/r3: the three right-hand sides,
C     e1: reference solution, h1: copy of e1, h2: set by
C     set_h2_as_rhoJac_GL below
86a4271fSThilina Rathnayake      common /vcrns/ u1(lt),r1(lt),r2(lt),r3(lt)
86a4271fSThilina Rathnayake      common /vcrny/ e1(lt)
86a4271fSThilina Rathnayake      common /vcrvh/ h1(lt),h2(lx*lelt),pap(3)
C     coords is handed to libCEED by pointer (ceed_use_pointer)
86a4271fSThilina Rathnayake      real*8 coords(ldim*lx*lelt)
86a4271fSThilina Rathnayake
C     NOTE(review): ifh3, stridesw and the parameter ld are declared
C     but not referenced anywhere in this routine.
86a4271fSThilina Rathnayake      logical ifh3
e2b2c771Svaleria      integer*8 nnode
86a4271fSThilina Rathnayake      integer ceed,err,test
86a4271fSThilina Rathnayake      character*64 spec
86a4271fSThilina Rathnayake
34d77899SValeria Barra      integer p,q,ncompx,ncompu,enode,lnode
86a4271fSThilina Rathnayake      integer vec_p1,vec_ap1,vec_qdata,vec_coords,vec_rhs
7509a596Sjeremylt      integer stridesu(3),stridesx(3),stridesw(3)
86a4271fSThilina Rathnayake      integer erstrctu,erstrctx,erstrctw
86a4271fSThilina Rathnayake      integer basisu,basisx
86a4271fSThilina Rathnayake      integer qf_mass,qf_setup
86a4271fSThilina Rathnayake      integer op_mass,op_setup
86a4271fSThilina Rathnayake      real*8  x,y,z
86a4271fSThilina Rathnayake      integer*8 offset
86a4271fSThilina Rathnayake
C     QFunction bodies defined elsewhere in this file; passed to
C     libCEED as procedure arguments
86a4271fSThilina Rathnayake      external massf,masssetupf
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      ifield = 1
86a4271fSThilina Rathnayake      nxq    = nx1+1
86a4271fSThilina Rathnayake      n = nx1*ny1*nz1*nelt
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      ifsync = .false.
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up coordinates
C     Per element j the layout is lx x-values, then lx y-values, then
C     lx z-values.  ii runs over all local points of xm1/ym1/zm1.
C     NOTE(review): the element stride is hard-coded as 3*lx; this
C     agrees with the enode*ldim stride in stridesx only for ldim=3.
86a4271fSThilina Rathnayake      ii=0
86a4271fSThilina Rathnayake      do j=0,nelt-1
86a4271fSThilina Rathnayake      do i=1,lx
86a4271fSThilina Rathnayake        ii=ii+1
86a4271fSThilina Rathnayake        x = xm1(ii,1,1,1)
86a4271fSThilina Rathnayake        y = ym1(ii,1,1,1)
86a4271fSThilina Rathnayake        z = zm1(ii,1,1,1)
86a4271fSThilina Rathnayake        coords(i+0*lx+3*j*lx)=x
86a4271fSThilina Rathnayake        coords(i+1*lx+3*j*lx)=y
86a4271fSThilina Rathnayake        coords(i+2*lx+3*j*lx)=z
86a4271fSThilina Rathnayake      enddo
86a4271fSThilina Rathnayake      enddo
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Init ceed library
C     spec is the resource string from get_spec, NUL-terminated here
86a4271fSThilina Rathnayake      call get_spec(spec)
86a4271fSThilina Rathnayake      call ceedinit(trim(spec)//char(0),ceed,err)
86a4271fSThilina Rathnayake
C     test.eq.1 enables the pass/fail messages printed further down
86a4271fSThilina Rathnayake      call get_test(test)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up Nek geometry data
86a4271fSThilina Rathnayake      call geodatq       (gf,bmq,w3mq,nxq)         ! Set up gf() arrays
86a4271fSThilina Rathnayake      call set_h2_as_rhoJac_GL(h2,bmq,nxq)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up true soln
86a4271fSThilina Rathnayake      call dist_fld_h1   (e1)
86a4271fSThilina Rathnayake      call copy          (h1,e1,n)                 ! Save exact soln in h1
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up solver parameters
C     maxit is passed to cggos and read back afterwards as maxits;
C     presumably cggos overwrites it with the iteration count, which
C     is why it is reset to 100 before each later solve.
86a4271fSThilina Rathnayake      tol       = 1e-10
86a4271fSThilina Rathnayake      param(22) = tol
86a4271fSThilina Rathnayake      maxit     = 100
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      call nekgsync()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed basis for mesh and computation
C     p = nx1 and q = p+1 are the two size arguments given to the
C     tensor H1 Lagrange basis (nodes / quadrature points per
C     direction in the libCEED API -- confirm against its docs).
C     NOTE(review): bp3 passes ldim,ncompx for the mesh basis and
C     ldim for the solution basis; ndim is used here instead.
86a4271fSThilina Rathnayake      p=nx1
86a4271fSThilina Rathnayake      q=p+1
34d77899SValeria Barra      ncompu=1
34d77899SValeria Barra      ncompx=ldim
86a4271fSThilina Rathnayake      call ceedbasiscreatetensorh1lagrange(ceed,ndim,ndim,p,q,
86a4271fSThilina Rathnayake     $  ceed_gauss,basisx,err)
34d77899SValeria Barra      call ceedbasiscreatetensorh1lagrange(ceed,ndim,ncompu,p,q,
86a4271fSThilina Rathnayake     $  ceed_gauss,basisu,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed element restrictions for mesh and computation
C     erstrctx: coordinates (ldim components), erstrctu: solution
C     (ncompu components), erstrctw: one value per quadrature point,
C     with the stride layout left to the backend.
e2b2c771Svaleria      enode=p**ldim
34d77899SValeria Barra      lnode=enode*nelt*ncompu
7509a596Sjeremylt      stridesx=[1,enode,enode*ldim]
d979a051Sjeremylt      call ceedelemrestrictioncreatestrided(ceed,nelt,enode,ldim,
d979a051Sjeremylt     $  ldim*lnode,stridesx,erstrctx,err)
7509a596Sjeremylt      stridesu=[1,enode,enode*ncompu]
d979a051Sjeremylt      call ceedelemrestrictioncreatestrided(ceed,nelt,enode,ncompu,
d979a051Sjeremylt     $  ncompu*lnode,stridesu,erstrctu,err)
7509a596Sjeremylt      call ceedelemrestrictioncreatestrided(ceed,nelt,q**ldim,
d979a051Sjeremylt     $  1,nelt*q**ldim,ceed_strides_backend,erstrctw,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed vectors
e2b2c771Svaleria      call ceedvectorcreate(ceed,lnode,vec_p1,err)
e2b2c771Svaleria      call ceedvectorcreate(ceed,lnode,vec_ap1,err)
e2b2c771Svaleria      call ceedvectorcreate(ceed,lnode,vec_rhs,err)
86a4271fSThilina Rathnayake      call ceedvectorcreate(ceed,ldim*lx*nelt,vec_coords,err)
86a4271fSThilina Rathnayake      call ceedvectorcreate(ceed,nelt*q**ldim,vec_qdata,err)
86a4271fSThilina Rathnayake
C     offset is reused unchanged (0) by every ceedvectorsetarray call
86a4271fSThilina Rathnayake      offset=0
86a4271fSThilina Rathnayake      call ceedvectorsetarray(vec_coords,ceed_mem_host,
86a4271fSThilina Rathnayake     $  ceed_use_pointer,coords,offset,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed qfunctions for masssetupf and massf
C     NOTE(review): bp3 appends //char(0) to the source-path string;
C     that terminator is not appended in the two calls below.
86a4271fSThilina Rathnayake      call ceedqfunctioncreateinterior(ceed,1,masssetupf,
2d50dd3dSjeremylt     $  EXAMPLE_DIR
2d50dd3dSjeremylt     $  //'bps/bps.h:masssetupf',qf_setup,err)
34d77899SValeria Barra      call ceedqfunctionaddinput(qf_setup,'x',ncompx,
86a4271fSThilina Rathnayake     $  ceed_eval_interp,err)
34d77899SValeria Barra      call ceedqfunctionaddinput(qf_setup,'dx',ncompx*ldim,
86a4271fSThilina Rathnayake     $  ceed_eval_grad,err)
34d77899SValeria Barra      call ceedqfunctionaddinput(qf_setup,'weight',ncompu,
86a4271fSThilina Rathnayake     $  ceed_eval_weight,err)
a2fa7910SValeria Barra      call ceedqfunctionaddoutput(qf_setup,'qdata',ncompu,
86a4271fSThilina Rathnayake     $  ceed_eval_none,err)
34d77899SValeria Barra      call ceedqfunctionaddoutput(qf_setup,'rhs',ncompu,
86a4271fSThilina Rathnayake     $  ceed_eval_interp,err)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      call ceedqfunctioncreateinterior(ceed,1,massf,
2d50dd3dSjeremylt     $  EXAMPLE_DIR
2d50dd3dSjeremylt     $  //'bps/bps.h:massf',qf_mass,err)
34d77899SValeria Barra      call ceedqfunctionaddinput(qf_mass,'u',ncompu,
86a4271fSThilina Rathnayake     $  ceed_eval_interp,err)
a2fa7910SValeria Barra      call ceedqfunctionaddinput(qf_mass,'qdata',ncompu,
86a4271fSThilina Rathnayake     $  ceed_eval_none,err)
34d77899SValeria Barra      call ceedqfunctionaddoutput(qf_mass,'v',ncompu,
86a4271fSThilina Rathnayake     $  ceed_eval_interp,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed operators
C     op_setup: active input is the coordinate vector (fields x and
C     dx), active output is qdata; the rhs field is bound to vec_rhs.
86a4271fSThilina Rathnayake      call ceedoperatorcreate(ceed,qf_setup,
442e7f0bSjeremylt     $  ceed_qfunction_none,ceed_qfunction_none,op_setup,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_setup,'x',erstrctx,
a8d32208Sjeremylt     $  basisx,ceed_vector_active,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_setup,'dx',erstrctx,
a8d32208Sjeremylt     $  basisx,ceed_vector_active,err)
15910d16Sjeremylt      call ceedoperatorsetfield(op_setup,'weight',
15910d16Sjeremylt     $  ceed_elemrestriction_none,basisx,ceed_vector_none,err)
a2fa7910SValeria Barra      call ceedoperatorsetfield(op_setup,'qdata',erstrctw,
a8d32208Sjeremylt     $  ceed_basis_collocated,ceed_vector_active,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_setup,'rhs',erstrctu,
a8d32208Sjeremylt     $  basisu,vec_rhs,err)
86a4271fSThilina Rathnayake
C     op_mass: u and v are the active input/output; qdata is read
C     from vec_qdata, which op_setup fills below.
86a4271fSThilina Rathnayake      call ceedoperatorcreate(ceed,qf_mass,
442e7f0bSjeremylt     $  ceed_qfunction_none,ceed_qfunction_none,op_mass,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_mass,'u',erstrctu,
a8d32208Sjeremylt     $  basisu,ceed_vector_active,err)
a2fa7910SValeria Barra      call ceedoperatorsetfield(op_mass,'qdata',erstrctw,
a8d32208Sjeremylt     $  ceed_basis_collocated,vec_qdata,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_mass,'v',erstrctu,
a8d32208Sjeremylt     $  basisu,ceed_vector_active,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Compute setup data
C     vec_rhs is pointed at r1 first, so the rhs output of op_setup
C     lands directly in r1.
86a4271fSThilina Rathnayake      call ceedvectorsetarray(vec_rhs,ceed_mem_host,
86a4271fSThilina Rathnayake     $  ceed_use_pointer,r1,offset,err)
86a4271fSThilina Rathnayake      call ceedoperatorapply(op_setup,vec_coords,vec_qdata,
86a4271fSThilina Rathnayake     $  ceed_request_immediate,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up true RHS
86a4271fSThilina Rathnayake      call dssum         (r1,nx1,ny1,nz1)          ! r1
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up algebraic RHS with libCEED
C     vec_p1 wraps h1 and vec_ap1 wraps r2 (both by pointer)
86a4271fSThilina Rathnayake      call ceedvectorsetarray(vec_p1,ceed_mem_host,
86a4271fSThilina Rathnayake     $  ceed_use_pointer,h1,offset,err)
86a4271fSThilina Rathnayake      call ceedvectorsetarray(vec_ap1,ceed_mem_host,
86a4271fSThilina Rathnayake     $  ceed_use_pointer,r2,offset,err)
86a4271fSThilina Rathnayake      call ceedoperatorapply(op_mass,vec_p1,vec_ap1,
86a4271fSThilina Rathnayake     $  ceed_request_immediate,err)                ! r2 = A_ceed*h1
86a4271fSThilina Rathnayake      call dssum         (r2,nx1,ny1,nz1)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up algebraic RHS with Nek5000
86a4271fSThilina Rathnayake      call axhm1         (pap,r3,h1,h1,h2,'bp1')   ! r3 = A_nek5k*h1
86a4271fSThilina Rathnayake      call dssum         (r3,nx1,ny1,nz1)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      call nekgsync()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Solve true RHS
86a4271fSThilina Rathnayake      if (nid.eq.0) write (6,*) "libCEED true RHS"
86a4271fSThilina Rathnayake      tstart = dnekclock()
86a4271fSThilina Rathnayake      call cggos(u1,r1,h1,h2,vmult,binvm1,tol,ceed,op_mass,
86a4271fSThilina Rathnayake     $  vec_p1,vec_ap1,maxit,'bp1')
86a4271fSThilina Rathnayake      tstop  = dnekclock()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Output
C     er1 compares the CG result u1 with the reference e1 (glrdif)
86a4271fSThilina Rathnayake      telaps = (tstop-tstart)
86a4271fSThilina Rathnayake      maxits = maxit
86a4271fSThilina Rathnayake      er1 = glrdif(u1,e1,n)
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,3) lx1,nelgv,er1,' error ',maxit
86a4271fSThilina Rathnayake
C     In test mode rank 0 flags a solve that used all 100 iterations
C     or whose error exceeds 5e-3 (looser than the 1e-5 used for the
C     two algebraic right-hand sides below).
86a4271fSThilina Rathnayake      if (test.eq.1.and.nid.eq.0) then
86a4271fSThilina Rathnayake        if (maxit>=100) then
86a4271fSThilina Rathnayake          write(6,*) "UNCONVERGED CG"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake        if (dabs(er1)>5e-3) then
86a4271fSThilina Rathnayake          write(6,*) "ERROR IS TOO LARGE"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake      endif
86a4271fSThilina Rathnayake
C     nnode is integer*8 and is assigned nelgt before being scaled,
C     presumably so the product is formed in 64-bit arithmetic.
86a4271fSThilina Rathnayake      nx     = nx1-1
e2b2c771Svaleria      nnode  = nelgt            ! nnodes
e2b2c771Svaleria      nnode  = nnode*(nx**ldim) ! nnodes
e2b2c771Svaleria      nppp   = nnode/np         ! nnodes/proc
86a4271fSThilina Rathnayake
05939c60Sjeremylt      dofps  = nnode/telaps     ! DOF/sec - scalar form
86a4271fSThilina Rathnayake      titers = telaps/maxits    ! time per iteration
86a4271fSThilina Rathnayake      tppp_s = titers/nppp      ! time per iteration per local point
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,1) 'case scalar:'
05939c60Sjeremylt     $ ,np,nx,nelt,nelgt,nnode,nppp,maxits,telaps,dofps,titers,tppp_s
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Solve libCEED algebraic RHS
86a4271fSThilina Rathnayake      if (nid.eq.0) write (6,*) "libCEED algebraic RHS"
86a4271fSThilina Rathnayake      maxit = 100
86a4271fSThilina Rathnayake      tstart = dnekclock()
86a4271fSThilina Rathnayake      call cggos(u1,r2,h1,h2,vmult,binvm1,tol,ceed,op_mass,
86a4271fSThilina Rathnayake     $  vec_p1,vec_ap1,maxit,'bp1')
86a4271fSThilina Rathnayake      tstop  = dnekclock()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Output
86a4271fSThilina Rathnayake      telaps = (tstop-tstart)
86a4271fSThilina Rathnayake      maxits = maxit
86a4271fSThilina Rathnayake      er1 = glrdif(u1,e1,n)
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,3) lx1,nelgv,er1,' error ',maxit
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (test.eq.1.and.nid.eq.0) then
86a4271fSThilina Rathnayake        if (maxit>=100) then
86a4271fSThilina Rathnayake          write(6,*) "UNCONVERGED CG"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake        if (dabs(er1)>1e-5) then
86a4271fSThilina Rathnayake          write(6,*) "ERROR IS TOO LARGE"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake      endif
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      nx      = nx1-1
e2b2c771Svaleria      nnode   = nelgt            ! nnodes
e2b2c771Svaleria      nnode   = nnode*(nx**ldim) ! nnodes
e2b2c771Svaleria      nppp    = nnode/np         ! nnodes/proc
86a4271fSThilina Rathnayake
05939c60Sjeremylt      dofps   = nnode/telaps     ! DOF/sec - scalar form
86a4271fSThilina Rathnayake      titers  = telaps/maxits    ! time per iteration
86a4271fSThilina Rathnayake      tppp_s  = titers/nppp      ! time per iteration per local point
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,1) 'case scalar:'
05939c60Sjeremylt     $ ,np,nx,nelt,nelgt,nnode,nppp,maxits,telaps,dofps,titers,tppp_s
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Solve Nek5000 algebraic RHS
86a4271fSThilina Rathnayake      if (nid.eq.0) write (6,*) "Nek5000 algebraic RHS"
86a4271fSThilina Rathnayake      maxit = 100
86a4271fSThilina Rathnayake      tstart = dnekclock()
86a4271fSThilina Rathnayake      call cggos(u1,r3,h1,h2,vmult,binvm1,tol,ceed,op_mass,
86a4271fSThilina Rathnayake     $  vec_p1,vec_ap1,maxit,'bp1')
86a4271fSThilina Rathnayake      tstop  = dnekclock()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Output
86a4271fSThilina Rathnayake      telaps = (tstop-tstart)
86a4271fSThilina Rathnayake      maxits = maxit
86a4271fSThilina Rathnayake      er1 = glrdif(u1,e1,n)
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,3) lx1,nelgv,er1,' error ',maxit
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (test.eq.1.and.nid.eq.0) then
86a4271fSThilina Rathnayake        if (maxit>=100) then
86a4271fSThilina Rathnayake          write(6,*) "UNCONVERGED CG"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake        if (dabs(er1)>1e-5) then
86a4271fSThilina Rathnayake          write(6,*) "ERROR IS TOO LARGE"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake      endif
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      nx      = nx1-1
e2b2c771Svaleria      nnode   = nelgt            ! nnodes
e2b2c771Svaleria      nnode   = nnode*(nx**ldim) ! nnodes
e2b2c771Svaleria      nppp    = nnode/np         ! nnodes/proc
86a4271fSThilina Rathnayake
05939c60Sjeremylt      dofps   = nnode/telaps     ! DOF/sec - scalar form
86a4271fSThilina Rathnayake      titers  = telaps/maxits    ! time per iteration
86a4271fSThilina Rathnayake      tppp_s  = titers/nppp      ! time per iteration per local point
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,1) 'case scalar:'
05939c60Sjeremylt     $ ,np,nx,nelt,nelgt,nnode,nppp,maxits,telaps,dofps,titers,tppp_s
86a4271fSThilina Rathnayake
C     Format 1: label, seven integers (np ... maxits), four reals
C     Format 3: lx1, nelgv, error value, the ' error ' tag, maxit
86a4271fSThilina Rathnayake    1 format(a12,i7,i3,i7,i10,i14,i10,i4,1p4e13.5)
86a4271fSThilina Rathnayake    3 format(i3,i9,e12.4,1x,a8,i9)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Destroy ceed handles
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_p1,err)
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_ap1,err)
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_rhs,err)
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_qdata,err)
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_coords,err)
86a4271fSThilina Rathnayake      call ceedelemrestrictiondestroy(erstrctu,err)
86a4271fSThilina Rathnayake      call ceedelemrestrictiondestroy(erstrctx,err)
86a4271fSThilina Rathnayake      call ceedelemrestrictiondestroy(erstrctw,err)
86a4271fSThilina Rathnayake      call ceedbasisdestroy(basisu,err)
86a4271fSThilina Rathnayake      call ceedbasisdestroy(basisx,err)
86a4271fSThilina Rathnayake      call ceedqfunctiondestroy(qf_setup,err)
86a4271fSThilina Rathnayake      call ceedqfunctiondestroy(qf_mass,err)
86a4271fSThilina Rathnayake      call ceedoperatordestroy(op_setup,err)
86a4271fSThilina Rathnayake      call ceedoperatordestroy(op_mass,err)
86a4271fSThilina Rathnayake      call ceeddestroy(ceed,err)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      return
86a4271fSThilina Rathnayake      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
86a4271fSThilina Rathnayake      subroutine bp3
86a4271fSThilina RathnayakeC     Solution to BP3 using libCEED
86a4271fSThilina Rathnayake      include 'SIZE'
86a4271fSThilina Rathnayake      include 'TOTAL'
86a4271fSThilina Rathnayake      include 'CTIMER'  ! ifsync
86a4271fSThilina Rathnayake      include 'FDMH1'
*ec3da8bcSJed Brown      include 'ceed/fortran.h'
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      parameter (lzq=lx1+1)
86a4271fSThilina Rathnayake      parameter (lx=lx1*ly1*lz1,lg=3+3*(ldim-2),lq=lzq**ldim)
86a4271fSThilina Rathnayake      common /bpgfactors/ gf(lg*lq,lelt),bmq(lq,lelt),w3mq(lq)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      parameter (lt=lx1*ly1*lz1*lelt)
86a4271fSThilina Rathnayake      parameter (ld=lxd*lyd*lzd*lelt)
86a4271fSThilina Rathnayake      common /vcrns/ u1(lt),r1(lt),r2(lt),r3(lt)
86a4271fSThilina Rathnayake      common /vcrny/ e1(lt)
86a4271fSThilina Rathnayake      common /vcrvh/ h1(lt),h2(ld),pap(3)
86a4271fSThilina Rathnayake      real*8 coords(ldim*lx*lelt)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      logical ifh3
e2b2c771Svaleria      integer*8 nnode
86a4271fSThilina Rathnayake      integer ceed,err,test
86a4271fSThilina Rathnayake      character*64 spec
86a4271fSThilina Rathnayake
34d77899SValeria Barra      integer p,q,ncompx,ncompu,enode,lnode
86a4271fSThilina Rathnayake      integer vec_p1,vec_ap1,vec_qdata,vec_coords,vec_rhs
7509a596Sjeremylt      integer stridesu(3),stridesx(3),stridesw(3)
86a4271fSThilina Rathnayake      integer erstrctu,erstrctx,erstrctw
86a4271fSThilina Rathnayake      integer basisu,basisx
86a4271fSThilina Rathnayake      integer qf_diffusion,qf_setup
86a4271fSThilina Rathnayake      integer op_diffusion,op_setup
86a4271fSThilina Rathnayake      integer ii,i,ngeo
86a4271fSThilina Rathnayake      real*8  x,y,z
86a4271fSThilina Rathnayake      integer*8 offset
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      external diffusionf,diffsetupf
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      ifield = 1
86a4271fSThilina Rathnayake      nxq    = nx1+1
86a4271fSThilina Rathnayake      n = nx1*ny1*nz1*nelt
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      ifsync = .false.
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up coordinates and mask
86a4271fSThilina Rathnayake      ii=0
86a4271fSThilina Rathnayake      do j=0,nelt-1
86a4271fSThilina Rathnayake      do i=1,lx
86a4271fSThilina Rathnayake        ii=ii+1
86a4271fSThilina Rathnayake        x = xm1(ii,1,1,1)
86a4271fSThilina Rathnayake        y = ym1(ii,1,1,1)
86a4271fSThilina Rathnayake        z = zm1(ii,1,1,1)
86a4271fSThilina Rathnayake        coords(i+0*lx+3*j*lx)=x
86a4271fSThilina Rathnayake        coords(i+1*lx+3*j*lx)=y
86a4271fSThilina Rathnayake        coords(i+2*lx+3*j*lx)=z
86a4271fSThilina Rathnayake        if ( x.eq.0.or.x.eq.1
86a4271fSThilina Rathnayake     $   .or.y.eq.0.or.y.eq.1
86a4271fSThilina Rathnayake     $   .or.z.eq.0.or.z.eq.1 ) then
86a4271fSThilina Rathnayake          h2(ii)=0.
86a4271fSThilina Rathnayake        else
86a4271fSThilina Rathnayake          h2(ii)=1.
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake      enddo
86a4271fSThilina Rathnayake      enddo
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Init ceed library
86a4271fSThilina Rathnayake      call get_spec(spec)
86a4271fSThilina Rathnayake      call ceedinit(trim(spec)//char(0),ceed,err)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      call get_test(test)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up Nek geometry data
86a4271fSThilina Rathnayake      call geodatq       (gf,bmq,w3mq,nxq)         ! Set up gf() arrays
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up true soln
86a4271fSThilina Rathnayake      call sin_fld_h1    (e1)
86a4271fSThilina Rathnayake      call xmask1        (e1,h2,nelt)
86a4271fSThilina Rathnayake      call copy          (h1,e1,n)                 ! Save exact soln in h1
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up solver parameters
86a4271fSThilina Rathnayake      tol       = 1e-10
86a4271fSThilina Rathnayake      param(22) = tol
86a4271fSThilina Rathnayake      maxit     = 100
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      call nekgsync()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed basis for mesh and computation
86a4271fSThilina Rathnayake      p=nx1
86a4271fSThilina Rathnayake      q=p+1
34d77899SValeria Barra      ncompu=1
34d77899SValeria Barra      ncompx=ldim
34d77899SValeria Barra      call ceedbasiscreatetensorh1lagrange(ceed,ldim,ncompx,p,q,
86a4271fSThilina Rathnayake     $  ceed_gauss,basisx,err)
34d77899SValeria Barra      call ceedbasiscreatetensorh1lagrange(ceed,ldim,ncompu,p,q,
86a4271fSThilina Rathnayake     $  ceed_gauss,basisu,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed element restrictions for mesh and computation
e2b2c771Svaleria      enode=p**ldim
34d77899SValeria Barra      lnode=enode*nelt*ncompu
86a4271fSThilina Rathnayake      ngeo=(ldim*(ldim+1))/2
7509a596Sjeremylt      stridesx=[1,enode,enode*ldim]
d979a051Sjeremylt      call ceedelemrestrictioncreatestrided(ceed,nelt,enode,ldim,
d979a051Sjeremylt     $  ldim*lnode,stridesx,erstrctx,err)
7509a596Sjeremylt      stridesu=[1,enode,enode*ncompu]
d979a051Sjeremylt      call ceedelemrestrictioncreatestrided(ceed,nelt,enode,ncompu,
d979a051Sjeremylt     $  ncompu*lnode,stridesu,erstrctu,err)
7509a596Sjeremylt      stridesw=[1,q**ldim,ngeo*q**ldim]
7509a596Sjeremylt      call ceedelemrestrictioncreatestrided(ceed,nelt,q**ldim,
d979a051Sjeremylt     $  ngeo,nelt*q**ldim*ngeo,stridesw,erstrctw,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed vectors
e2b2c771Svaleria      call ceedvectorcreate(ceed,lnode,vec_p1,err)
e2b2c771Svaleria      call ceedvectorcreate(ceed,lnode,vec_ap1,err)
e2b2c771Svaleria      call ceedvectorcreate(ceed,lnode,vec_rhs,err)
86a4271fSThilina Rathnayake      call ceedvectorcreate(ceed,ldim*lx*nelt,vec_coords,err)
86a4271fSThilina Rathnayake      call ceedvectorcreate(ceed,nelt*ngeo*q**ldim,vec_qdata,err)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      offset=0
86a4271fSThilina Rathnayake      call ceedvectorsetarray(vec_coords,ceed_mem_host,
86a4271fSThilina Rathnayake     $  ceed_use_pointer,coords,offset,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed qfunctions for diffsetupf and diffusionf
86a4271fSThilina Rathnayake      call ceedqfunctioncreateinterior(ceed,1,diffsetupf,
2d50dd3dSjeremylt     $  EXAMPLE_DIR
2d50dd3dSjeremylt     $  //'bps/bps.h:diffsetupf'//char(0),qf_setup,err)
34d77899SValeria Barra      call ceedqfunctionaddinput(qf_setup,'x',ncompx,
86a4271fSThilina Rathnayake     $  ceed_eval_interp,err)
34d77899SValeria Barra      call ceedqfunctionaddinput(qf_setup,'dx',ncompx*ldim,
86a4271fSThilina Rathnayake     $  ceed_eval_grad,err)
34d77899SValeria Barra      call ceedqfunctionaddinput(qf_setup,'weight',ncompu,
86a4271fSThilina Rathnayake     $  ceed_eval_weight,err)
a2fa7910SValeria Barra      call ceedqfunctionaddoutput(qf_setup,'qdata',ngeo,
86a4271fSThilina Rathnayake     $  ceed_eval_none,err)
34d77899SValeria Barra      call ceedqfunctionaddoutput(qf_setup,'rhs',ncompu,
86a4271fSThilina Rathnayake     $  ceed_eval_interp,err)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      call ceedqfunctioncreateinterior(ceed,1,diffusionf,
2d50dd3dSjeremylt     $  EXAMPLE_DIR
2d50dd3dSjeremylt     $  //'bps/bps.h:diffusionf'//char(0),qf_diffusion,err)
34d77899SValeria Barra      call ceedqfunctionaddinput(qf_diffusion,'u',ncompu*ldim,
86a4271fSThilina Rathnayake     $  ceed_eval_grad,err)
a2fa7910SValeria Barra      call ceedqfunctionaddinput(qf_diffusion,'qdata',ngeo,
86a4271fSThilina Rathnayake     $  ceed_eval_none,err)
34d77899SValeria Barra      call ceedqfunctionaddoutput(qf_diffusion,'v',ncompu*ldim,
86a4271fSThilina Rathnayake     $  ceed_eval_grad,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Create ceed operators
86a4271fSThilina Rathnayake      call ceedoperatorcreate(ceed,qf_setup,
442e7f0bSjeremylt     $  ceed_qfunction_none,ceed_qfunction_none,op_setup,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_setup,'x',erstrctx,
a8d32208Sjeremylt     $  basisx,ceed_vector_active,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_setup,'dx',erstrctx,
a8d32208Sjeremylt     $  basisx,ceed_vector_active,err)
15910d16Sjeremylt      call ceedoperatorsetfield(op_setup,'weight',
15910d16Sjeremylt     $  ceed_elemrestriction_none,basisx,ceed_vector_none,err)
a2fa7910SValeria Barra      call ceedoperatorsetfield(op_setup,'qdata',erstrctw,
a8d32208Sjeremylt     $  ceed_basis_collocated,ceed_vector_active,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_setup,'rhs',erstrctu,
a8d32208Sjeremylt     $  basisu,vec_rhs,err)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      call ceedoperatorcreate(ceed,qf_diffusion,
61dbc9d2Sjeremylt     $  ceed_qfunction_none,ceed_qfunction_none,op_diffusion,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_diffusion,'u',erstrctu,
a8d32208Sjeremylt     $  basisu,ceed_vector_active,err)
a2fa7910SValeria Barra      call ceedoperatorsetfield(op_diffusion,'qdata',erstrctw,
a8d32208Sjeremylt     $  ceed_basis_collocated,vec_qdata,err)
86a4271fSThilina Rathnayake      call ceedoperatorsetfield(op_diffusion,'v',erstrctu,
a8d32208Sjeremylt     $  basisu,ceed_vector_active,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Compute setup data
86a4271fSThilina Rathnayake      call ceedvectorsetarray(vec_rhs,ceed_mem_host,
86a4271fSThilina Rathnayake     $  ceed_use_pointer,r1,offset,err)
86a4271fSThilina Rathnayake      call ceedoperatorapply(op_setup,vec_coords,vec_qdata,
86a4271fSThilina Rathnayake     $  ceed_request_immediate,err)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up true RHS
86a4271fSThilina Rathnayake      call dssum         (r1,nx1,ny1,nz1)          ! r1
86a4271fSThilina Rathnayake      call xmask1        (r1,h2,nelt)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up algebraic RHS with libCEED
86a4271fSThilina Rathnayake      call ceedvectorsetarray(vec_p1,ceed_mem_host,
86a4271fSThilina Rathnayake     $  ceed_use_pointer,h1,offset,err)
86a4271fSThilina Rathnayake      call ceedvectorsetarray(vec_ap1,ceed_mem_host,
86a4271fSThilina Rathnayake     $  ceed_use_pointer,r2,offset,err)
86a4271fSThilina Rathnayake      call ceedoperatorapply(op_diffusion,vec_p1,vec_ap1,
86a4271fSThilina Rathnayake     $  ceed_request_immediate,err)                ! r2 = A_ceed*h1
86a4271fSThilina Rathnayake      call dssum         (r2,nx1,ny1,nz1)
86a4271fSThilina Rathnayake      call xmask1        (r2,h2,nelt)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Set up algebraic RHS with Nek5000
86a4271fSThilina Rathnayake      call axhm1         (pap,r3,h1,h1,h2,'bp3')   ! r3 = A_nek5k*h1
86a4271fSThilina Rathnayake      call dssum         (r3,nx1,ny1,nz1)
86a4271fSThilina Rathnayake      call xmask1        (r3,h2,nelt)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      call nekgsync()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Solve true RHS
86a4271fSThilina Rathnayake      if (nid.eq.0) write (6,*) "libCEED true RHS"
86a4271fSThilina Rathnayake      tstart = dnekclock()
86a4271fSThilina Rathnayake      call cggos(u1,r1,h1,h2,vmult,binvm1,tol,ceed,op_diffusion,
86a4271fSThilina Rathnayake     $  vec_p1,vec_ap1,maxit,'bp3')
86a4271fSThilina Rathnayake      tstop  = dnekclock()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Output
86a4271fSThilina Rathnayake      telaps = (tstop-tstart)
86a4271fSThilina Rathnayake      maxits = maxit
86a4271fSThilina Rathnayake      er1 = glrdif(u1,e1,n)
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,3) lx1,nelgv,er1,' error ',maxit
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (test.eq.1.and.nid.eq.0) then
86a4271fSThilina Rathnayake        if (maxit>=100) then
86a4271fSThilina Rathnayake          write(6,*) "UNCONVERGED CG"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake        if (dabs(er1)>1e-3) then
86a4271fSThilina Rathnayake          write(6,*) "ERROR IS TOO LARGE"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake      endif
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      nx      = nx1-1
e2b2c771Svaleria      nnode   = nelgt            ! nnodes
e2b2c771Svaleria      nnode   = nnode*(nx**ldim) ! nnodes
e2b2c771Svaleria      nppp    = nnode/np         ! nnodes/proc
86a4271fSThilina Rathnayake
05939c60Sjeremylt      dofps   = nnode/telaps     ! DOF/sec - scalar form
86a4271fSThilina Rathnayake      titers  = telaps/maxits    ! time per iteration
86a4271fSThilina Rathnayake      tppp_s  = titers/nppp      ! time per iteraton per local point
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,1) 'case scalar:'
05939c60Sjeremylt     $ ,np,nx,nelt,nelgt,nnode,nppp,maxits,telaps,dofps,titers,tppp_s
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Solve libCEED algebraic RHS
86a4271fSThilina Rathnayake      if (nid.eq.0) write (6,*) "libCEED algebraic RHS"
86a4271fSThilina Rathnayake      maxit = 100
86a4271fSThilina Rathnayake      tstart = dnekclock()
86a4271fSThilina Rathnayake      call cggos(u1,r2,h1,h2,vmult,binvm1,tol,ceed,op_diffusion,
86a4271fSThilina Rathnayake     $  vec_p1,vec_ap1,maxit,'bp3')
86a4271fSThilina Rathnayake      tstop  = dnekclock()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Output
86a4271fSThilina Rathnayake      telaps = (tstop-tstart)
86a4271fSThilina Rathnayake      maxits = maxit
86a4271fSThilina Rathnayake      er1 = glrdif(u1,e1,n)
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,3) lx1,nelgv,er1,' error ',maxit
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (test.eq.1.and.nid.eq.0) then
86a4271fSThilina Rathnayake        if (maxit>=100) then
86a4271fSThilina Rathnayake          write(6,*) "UNCONVERGED CG"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake        if (dabs(er1)>1e-9) then
86a4271fSThilina Rathnayake          write(6,*) "ERROR IS TOO LARGE"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake      endif
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      nx      = nx1-1
e2b2c771Svaleria      nnode   = nelgt            ! nnodes
e2b2c771Svaleria      nnode   = nnode*(nx**ldim) ! nnodes
e2b2c771Svaleria      nppp    = nnode/np         ! nnodes/proc
86a4271fSThilina Rathnayake
05939c60Sjeremylt      dofps   = nnode/telaps     ! DOF/sec - scalar form
86a4271fSThilina Rathnayake      titers  = telaps/maxits    ! time per iteration
86a4271fSThilina Rathnayake      tppp_s  = titers/nppp      ! time per iteraton per local point
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,1) 'case scalar:'
05939c60Sjeremylt     $ ,np,nx,nelt,nelgt,nnode,nppp,maxits,telaps,dofps,titers,tppp_s
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Solve Nek5000 algebraic RHS
86a4271fSThilina Rathnayake      if (nid.eq.0) write (6,*) "Nek5000 algebraic RHS"
86a4271fSThilina Rathnayake      maxit = 100
86a4271fSThilina Rathnayake      tstart = dnekclock()
86a4271fSThilina Rathnayake      call cggos(u1,r3,h1,h2,vmult,binvm1,tol,ceed,op_diffusion,
86a4271fSThilina Rathnayake     $  vec_p1,vec_ap1,maxit,'bp3')
86a4271fSThilina Rathnayake      tstop  = dnekclock()
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Output
86a4271fSThilina Rathnayake      telaps = (tstop-tstart)
86a4271fSThilina Rathnayake      maxits = maxit
86a4271fSThilina Rathnayake      er1 = glrdif(u1,e1,n)
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,3) lx1,nelgv,er1,' error ',maxit
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (test.eq.1.and.nid.eq.0) then
86a4271fSThilina Rathnayake        if (maxit>=100) then
86a4271fSThilina Rathnayake          write(6,*) "UNCONVERGED CG"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake        if (dabs(er1)>1e-9) then
86a4271fSThilina Rathnayake          write(6,*) "ERROR IS TOO LARGE"
86a4271fSThilina Rathnayake        endif
86a4271fSThilina Rathnayake      endif
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      nx      = nx1-1
e2b2c771Svaleria      nnode   = nelgt            ! nnodes
e2b2c771Svaleria      nnode   = nnode*(nx**ldim) ! nnodes
e2b2c771Svaleria      nppp    = nnode/np         ! nnodes/proc
86a4271fSThilina Rathnayake
61dbc9d2Sjeremylt      dofps   = nnode/telaps     ! DOF/sec - scalar form
86a4271fSThilina Rathnayake      titers  = telaps/maxits    ! time per iteration
86a4271fSThilina Rathnayake      tppp_s  = titers/nppp      ! time per iteraton per local point
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      if (nid.eq.0) write(6,1) 'case scalar:'
61dbc9d2Sjeremylt     $ ,np,nx,nelt,nelgt,nnode,nppp,maxits,telaps,dofps,titers,tppp_s
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake    1 format(a12,i7,i3,i7,i10,i14,i10,i4,1p4e13.5)
86a4271fSThilina Rathnayake    3 format(i3,i9,e12.4,1x,a8,i9)
86a4271fSThilina Rathnayake
86a4271fSThilina RathnayakeC     Destroy ceed handles
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_p1,err)
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_ap1,err)
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_rhs,err)
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_qdata,err)
86a4271fSThilina Rathnayake      call ceedvectordestroy(vec_coords,err)
86a4271fSThilina Rathnayake      call ceedelemrestrictiondestroy(erstrctu,err)
86a4271fSThilina Rathnayake      call ceedelemrestrictiondestroy(erstrctx,err)
86a4271fSThilina Rathnayake      call ceedelemrestrictiondestroy(erstrctw,err)
86a4271fSThilina Rathnayake      call ceedbasisdestroy(basisu,err)
86a4271fSThilina Rathnayake      call ceedbasisdestroy(basisx,err)
86a4271fSThilina Rathnayake      call ceedqfunctiondestroy(qf_setup,err)
86a4271fSThilina Rathnayake      call ceedqfunctiondestroy(qf_diffusion,err)
86a4271fSThilina Rathnayake      call ceedoperatordestroy(op_setup,err)
86a4271fSThilina Rathnayake      call ceedoperatordestroy(op_diffusion,err)
86a4271fSThilina Rathnayake      call ceeddestroy(ceed,err)
86a4271fSThilina Rathnayake
86a4271fSThilina Rathnayake      return
86a4271fSThilina Rathnayake      end
C-----------------------------------------------------------------------
      subroutine cggos(u1,r1,h1,h2,rmult,binv,tin,ceed,ceed_op,vec_p1,
     $  vec_ap1,maxit,bpname)
C     Scalar preconditioned conjugate gradient iteration. The operator
C     is applied through axhm1_ceed.
C
C     Input:
C       r1      - right-hand side; overwritten with the residual
C       h1,h2   - forwarded to the preconditioner setup and to
C                 axhm1_ceed; h2 is also passed to xmask1 when bpname
C                 is not 'bp1'
C       rmult   - pointwise weights used in the r.z inner products
C       binv    - not referenced by this routine
C       tin     - tolerance on sqrt of the gop-summed r1*r1
C       ceed,ceed_op,vec_p1,vec_ap1
C               - libCEED handles forwarded to axhm1_ceed
C       bpname  - 'bp1' selects setprecn_bp1, any other value
C                 selects setprecn_bp3
C     In/Out:
C       maxit   - iteration limit on entry, number of iterations
C                 performed on return
C     Output:
C       u1      - solution, started from zero
      include 'SIZE'
      include 'TOTAL'
      include 'DOMAIN'
      include 'FDMH1'
      character*3 bpname

      parameter (lt=lx1*ly1*lz1*lelt)
      real*8 u1(lt),r1(lt),h1(lt),h2(lt)
C     rmult is indexed up to n below, so it is declared assumed-size
      real*8 rmult(*),binv(*)
      integer ceed,ceed_op,vec_ap1,vec_p1
      common /scrcg/ dpc(lt),p1(lt),z1(lt)
      common /scrca/ wv(4),wk(4),rpp1(4),rpp2(4),alph(4),beta(4),pap(4)

C     ap1 shares storage with z1: A*p is consumed by the u1/r1 update
C     before z1 is rebuilt further down in the same iteration
      real*8 ap1(lt)
      equivalence (ap1,z1)

      nel   = nelfld(ifield)
      nxyz  = lx1*ly1*lz1
      n     = nxyz*nel
      nx    = nx1-1                  ! Polynomial order (just for i/o)

      tol=tin

      if(bpname.ne.'bp1') then
        call setprecn_bp3(dpc,h1,h2) ! Set up diagonal preconditioner
      else
        call setprecn_bp1(dpc,h1,h2) ! Set up diagonal preconditioner
      endif

      call rzero         (u1,n)      ! Initialize solution

C     p = dpc*r and the initial weighted product r.p
      wv(1)=0
      do i=1,n
         s=rmult(i)
         p1(i)=dpc(i)*r1(i)
         wv(1)=wv(1)+s*p1(i)*r1(i)
      enddo
      call gop(wv(1),wk,'+  ',1)
      rpp1(1) = wv  (1)

      do 1000 iter=1,maxit
         call axhm1_ceed (pap,ap1,p1,h1,h2,ceed,ceed_op,
     $     vec_ap1,vec_p1)
         call dssum    (ap1,nx1,ny1,nz1)
         if (bpname.ne.'bp1') call xmask1(ap1,h2,nel)

         call gop      (pap,wk,'+  ',1)
         alph(1) = rpp1(1)/pap(1)

         do i=1,n
            u1(i)=u1(i)+alph(1)* p1(i)
            r1(i)=r1(i)-alph(1)*ap1(i)
         enddo

C        tolerance check here
         call rzero(wv,2)
         do i=1,n
            wv(1)=wv(1)+r1(i)*r1(i)            ! L2 error estimate
            z1(i)=dpc(i)*r1(i)                 ! z = dpc*r
            wv(2)=wv(2)+rmult(i)*z1(i)*r1(i)   ! r z
         enddo
         call gop(wv,wk,'+  ',2)

C        if (nio.eq.0) write(6,1) ifield,istep,iter,nx,(wv(k),k=1,1)
  1     format(i2,i9,i5,i4,1p1e12.4,' cggos')

         enorm=sqrt(wv(1))
         if (enorm.lt.tol) then
            ifin = iter
            if (nio.eq.0) write(6,3000) istep,ifin,enorm,tol
            goto 9999
         endif
C        if (nio.eq.0) write(6,2) iter,enorm,alph(1),pap(1),'alpha'
 2      format(i5,1p3e12.4,2x,a5)

C        New search direction p = z + beta*p
         rpp2(1)=rpp1(1)
         rpp1(1)=wv  (2)
         beta1  =rpp1(1)/rpp2(1)
         do i=1,n
            p1(i)=z1(i) + beta1*p1(i)
         enddo

 1000 continue

C     Iteration limit reached without meeting the tolerance. A do loop
C     that runs to completion leaves iter at maxit+1, so step it back
C     before reporting so that the message shows the number of
C     iterations that were actually performed.
      iter = iter-1
      rbnorm=sqrt(wv(1))
      if (nio.eq.0) write (6,3001) istep,iter,rbnorm,tol

 9999 continue

      maxit=iter

 3000 format(i12,1x,'cggo scalar:',i6,1p5e13.4)
 3001 format(2i6,' Unconverged cggo scalar: rbnorm =',1p2e13.6)

      return
      end
C-----------------------------------------------------------------------
      subroutine axhm1_ceed(pap,ap1,p1,h1,h2,ceed,ceed_op,
     $  vec_ap1,vec_p1)
C     Conjugate gradient matvec carried out by a libCEED operator.
C     Input:  p1      - vector the operator is applied to
C             ceed_op - libCEED operator handle
C             vec_p1,vec_ap1 - libCEED vector handles that are pointed
C                       at p1 and ap1 for the duration of the apply
C             h1,h2,ceed - not referenced by this routine
C     Output: ap1     - result of applying ceed_op to p1
C             pap(1)  - sum of ap1*p1 over the nelt local elements
      include 'SIZE'
      include 'TOTAL'
      include 'ceed/fortran.h'

      parameter (lx=lx1*ly1*lz1)

      real*8   pap(3)
      real*8   ap1(lx,lelt)
      real*8    p1(lx,lelt)
      real*8    h1(lx,lelt),h2(lx,lelt)
      integer ceed,ceed_op,vec_ap1,vec_p1,err
      integer i,e
      integer*8 offset

C     Attach the host arrays to the libCEED vectors
      offset=0
      call ceedvectorsetarray(vec_p1,ceed_mem_host,ceed_use_pointer,
     $  p1,offset,err)
      call ceedvectorsetarray(vec_ap1,ceed_mem_host,ceed_use_pointer,
     $  ap1,offset,err)

      call ceedoperatorapply(ceed_op,vec_p1,vec_ap1,
     $  ceed_request_immediate,err)

C     Take the arrays back before ap1 is read below; the offset that
C     comes back from these calls is not used afterwards
      call ceedvectortakearray(vec_p1,ceed_mem_host,0,offset,err)
      call ceedvectortakearray(vec_ap1,ceed_mem_host,0,offset,err)

C     Local contribution to p.Ap; the caller reduces it with gop
      pap(1)=0.

      do e=1,nelt
         do i=1,lx
           pap(1)=pap(1)+ap1(i,e)*p1(i,e)
         enddo
      enddo

      return
      end
C-----------------------------------------------------------------------
      subroutine ax_e_bp1(w,u,g,h1,h2,b,ju,us,ut)
C     Local (single element) matrix-vector product for BP1 (mass
C     matrix): u is interpolated to the nx1+1 point grid, multiplied
C     pointwise by h2, and passed back through intp_rstd into w.
C     Input:  u   - element values
C             h2  - pointwise factor, (nx1+1)**ldim values
C             g,h1,b,us,ut - not referenced by this routine
C     Work:   ju  - (nx1+1)**ldim values
C     Output: w
      include 'SIZE'
      include 'TOTAL'

      parameter (lxyz=lx1*ly1*lz1,lg=3+3*(ldim-2))
      real*8 w(lxyz),u(lxyz),g(lg,lxyz),h1(lxyz),b(lxyz)
      real*8 us(lxyz),ut(lxyz)
C     ju and h2 are indexed up to (nx1+1)**ldim, which exceeds lxyz,
C     so they are declared assumed-size instead of with extent lxyz
      real*8 h2(*),ju(*)

      nxq = nx1+1 ! Number of quadrature points

      lxyzq = nxq**ldim

      call intp_rstd (ju,u,lx1,nxq,if3d,0) ! 0 --> Fwd interpolation
      do i=1,lxyzq
         ju(i)=ju(i)*h2(i) !! h2 must be on the fine grid, w/ quad wts
      enddo
      call intp_rstd (w,ju,lx1,nxq,if3d,1) ! 1 --> ju-->u

      return
      end
C-----------------------------------------------------------------------
      subroutine axhm1_bp1(pap,ap1,p1,h1,h2)
C     Conjugate gradient matvec for solution of BP1 (mass matrix)
C     Input:  p1  - vector to multiply
C             h1  - forwarded to ax_e_bp1
C             h2  - fine-grid factor, addressed linearly in chunks of
C                   (nx1+1)**ldim values per element
C     Output: ap1    - element-by-element product from ax_e_bp1
C             pap(1) - sum of ap1*p1 over the nelt local elements
      include 'SIZE'
      include 'TOTAL'

      parameter (lx=lx1*ly1*lz1,lg=3+3*(ldim-2))
      parameter (lzq=lx1+1,lq=lzq**ldim)
      real*8 gf(lg,lx,lelt)          ! Equivalence new gf() data
      equivalence (gf,g1m1)          ! layout to g1m1...g6m1

      real*8 pap(3)
      real*8 ap1(lx,lelt)
      real*8  p1(lx,lelt)
      real*8  h1(lx,lelt),h2(lx,lelt)

C     ur is the work array ax_e_bp1 fills with (nx1+1)**ldim values,
C     so the scratch arrays are sized for the fine grid
      real*8 ur(lq),us(lq),ut(lq)
      common /ctmp1/ ur,us,ut

      integer e

      pap(1)=0.

      k=1
      nxq = nx1+1

      do e=1,nelt

         call ax_e_bp1(ap1(1,e),p1(1,e),gf(1,1,e),h1(1,e),h2(k,1)
     $                                          ,bm1(1,1,1,e),ur,us,ut)
         do i=1,lx
           pap(1)=pap(1)+ap1(i,e)*p1(i,e)
         enddo
C        Advance by the nxq**ldim values ax_e_bp1 reads per element.
C        NOTE(review): assumes h2 is packed element after element with
C        no padding in 2D - confirm against the routine that fills it.
         k=k+nxq**ldim

      enddo

      return
      end
C-----------------------------------------------------------------------
      subroutine ax_e_bp3(w,u,g,ur,us,ut,wk)
C     Element-local matrix-vector product for BP3 (stiffness matrix).
C     u is interpolated to the lx1+1 point grid, differentiated with
C     loc_grad3, combined pointwise with the six entries of g, and
C     brought back through loc_grad3t and intp_rstd.
C     Input:  u,g
C     Work:   ur,us,ut,wk
C     Output: w
      include 'SIZE'
      include 'TOTAL'

      parameter (lzq=lx1+1)
      parameter (lxyz=lx1*lx1*lx1)
      parameter (lxyzq=lzq*lzq*lzq)

      real*8 w(lxyz),u(lxyz)
      real*8 g(2*ldim,lxyzq)
      real*8 ur(lxyzq),us(lxyzq),ut(lxyzq),wk(lxyzq)

      common /ctmp0/ tmp(lxyzq)
      common /dxmfine/ dxmq(lzq,lzq),dxtmq(lzq,lzq)

      nqm1 = lzq-1

C     Fine-grid values of u and their local derivatives
      call intp_rstd  (wk,u,lx1,lzq,if3d,0)
      call loc_grad3  (ur,us,ut,wk,nqm1,dxmq,dxtmq)

C     Pointwise product with the symmetric 3x3 factor stored in g as
C     (11,12,13,22,23,33)
      do i=1,lxyzq
         dudr = ur(i)
         duds = us(i)
         dudt = ut(i)
         ur(i) = g(1,i)*dudr + g(2,i)*duds + g(3,i)*dudt
         us(i) = g(2,i)*dudr + g(4,i)*duds + g(5,i)*dudt
         ut(i) = g(3,i)*dudr + g(5,i)*duds + g(6,i)*dudt
      enddo

C     Transposed derivative, then back to the lx1 point grid
      call loc_grad3t (wk,ur,us,ut,nqm1,dxmq,dxtmq,tmp)
      call intp_rstd  (w,wk,lx1,lzq,if3d,1)

      return
      end
C-----------------------------------------------------------------------
      subroutine axhm1_bp3(pap,ap1,p1,h1,h2)
C     Conjugate gradient matvec for BP3 (stiffness matrix), applied
C     one element at a time through ax_e_bp3.
C     Input:  p1     - vector to multiply
C             h1,h2  - not referenced by this routine
C     Output: ap1    - element-by-element product
C             pap(1) - sum of p1*ap1 over the nelt local elements
      include 'SIZE'
      include 'TOTAL'

      parameter (lzq=lx1+1)
      parameter (lx=lx1*ly1*lz1,lg=3+3*(ldim-2),lq=lzq**ldim)

      real*8 pap(3)
      real*8 ap1(lx,lelt),p1(lx,lelt)
      real*8 h1(lx,lelt),h2(lx,lelt)

C     Geometric factors on the lzq point grid
      common /bpgfactors/ gf(lg,lq,lelt),bmq(lq,lelt),w3mq(lq)

C     Scratch handed to ax_e_bp3
      real*8 ur(lq),us(lq),ut(lq),wk(lq)
      common /ctmp1/ ur,us,ut,wk

      integer iel

      pap(1)=0.
      do iel=1,nelt
         call ax_e_bp3(ap1(1,iel),p1(1,iel),gf(1,1,iel),ur,us,ut,wk)
         do i=1,lx
            pap(1)=pap(1)+p1(i,iel)*ap1(i,iel)
         enddo
      enddo

      return
      end
C-----------------------------------------------------------------------
      subroutine axhm1(pap,ap1,p1,h1,h2,bpname)
C     Conjugate gradient matvec dispatcher: forwards to the BP1 or
C     BP3 implementation selected by bpname and stops the program on
C     any other name.
C     Input:  p1,h1,h2,bpname
C     Output: ap1,pap
      include 'SIZE'
      include 'TOTAL'

      parameter (lx=lx1*ly1*lz1)

      character*3 bpname
      real*8 pap(3)
      real*8 ap1(lx,lelt),p1(lx,lelt)
      real*8 h1(lx,lelt),h2(lx,lelt)

      select case (bpname)
      case ('bp1')
         call axhm1_bp1(pap,ap1,p1,h1,h2)
      case ('bp3')
         call axhm1_bp3(pap,ap1,p1,h1,h2)
      case default
         write(6,*) bpname,' axhm1 bpname error'
         stop
      end select

      return
      end
C-----------------------------------------------------------------------
      subroutine get_bp(bp)
C     Get BP to run from the first command line argument.
C     Input:  (none)
C     Output: bp - 1 for "bp1", 3 for "bp3", 0 when the argument is
C                  missing or has any other value
      integer bp
      character*64 bpval

C     Blank the buffer first: without an argument getarg is never
C     called and the comparisons below would read an undefined value
      bpval=' '
      bp=0
      if(iargc().ge.1) then
        call getarg(1,bpval)
      endif
      if(bpval.eq."bp1") then
        bp=1
      elseif(bpval.eq."bp3") then
        bp=3
      endif

      return
      end
C-----------------------------------------------------------------------
      subroutine get_spec(spec)
C     Fetch the CEED backend specification.
C     Input:  (none)
C     Output: spec - second command line argument when at least two
C                    arguments are present, '/cpu/self' otherwise
      character*64 spec
      integer nargs

      nargs = iargc()
      spec = '/cpu/self'
      if (nargs.ge.2) call getarg(2,spec)

      return
      end
C-----------------------------------------------------------------------
      subroutine get_test(test)
C     Get test mode flag from the third command line argument.
C     Input:  (none)
C     Output: test - 1 when the third argument is "test", 0 when it
C                    is missing or has any other value
      integer test
      character*64 testval

C     Blank the buffer first: with fewer than three arguments getarg
C     is never called and the comparison below would read an
C     undefined value
      testval=' '
      test=0
      if(iargc().ge.3) then
        call getarg(3,testval)
      endif
      if(testval.eq."test") then
        test=1
      endif

      return
      end
86a4271fSThilina RathnayakeC-----------------------------------------------------------------------
61dbc9d2Sjeremylt