xref: /petsc/src/mat/utils/freespace.c (revision 0e97c5f4ea7aec56dfb77b4089b31f0ca8c13ef5)
1be1d678aSKris Buschelman #define PETSCMAT_DLL
2be1d678aSKris Buschelman 
37c4f633dSBarry Smith #include "../src/mat/utils/freespace.h"
470f19b1fSKris Buschelman 
570f19b1fSKris Buschelman #undef __FUNCT__
6a1a86e44SBarry Smith #define __FUNCT__ "PetscFreeSpaceGet"
7a1a86e44SBarry Smith PetscErrorCode PetscFreeSpaceGet(PetscInt n,PetscFreeSpaceList *list)
82e111b49SBarry Smith {
9a1a86e44SBarry Smith   PetscFreeSpaceList a;
10dfbe8321SBarry Smith   PetscErrorCode     ierr;
1170f19b1fSKris Buschelman 
1270f19b1fSKris Buschelman   PetscFunctionBegin;
13a1a86e44SBarry Smith   ierr = PetscMalloc(sizeof(struct _Space),&a);CHKERRQ(ierr);
142e111b49SBarry Smith   ierr = PetscMalloc(n*sizeof(PetscInt),&(a->array_head));CHKERRQ(ierr);
1570f19b1fSKris Buschelman   a->array            = a->array_head;
162e111b49SBarry Smith   a->local_remaining  = n;
1770f19b1fSKris Buschelman   a->local_used       = 0;
1870f19b1fSKris Buschelman   a->total_array_size = 0;
1970f19b1fSKris Buschelman   a->more_space       = NULL;
2070f19b1fSKris Buschelman 
2170f19b1fSKris Buschelman   if (*list) {
2270f19b1fSKris Buschelman     (*list)->more_space = a;
2370f19b1fSKris Buschelman     a->total_array_size = (*list)->total_array_size;
2470f19b1fSKris Buschelman   }
2570f19b1fSKris Buschelman 
262e111b49SBarry Smith   a->total_array_size += n;
2770f19b1fSKris Buschelman   *list               =  a;
2870f19b1fSKris Buschelman   PetscFunctionReturn(0);
2970f19b1fSKris Buschelman }
3070f19b1fSKris Buschelman 
3170f19b1fSKris Buschelman #undef __FUNCT__
32a1a86e44SBarry Smith #define __FUNCT__ "PetscFreeSpaceContiguous"
33a1a86e44SBarry Smith PetscErrorCode PetscFreeSpaceContiguous(PetscFreeSpaceList *head,PetscInt *space)
3438baddfdSBarry Smith {
35a1a86e44SBarry Smith   PetscFreeSpaceList a;
36dfbe8321SBarry Smith   PetscErrorCode     ierr;
3770f19b1fSKris Buschelman 
3870f19b1fSKris Buschelman   PetscFunctionBegin;
39c05d87d6SBarry Smith   while ((*head)) {
4070f19b1fSKris Buschelman     a     =  (*head)->more_space;
412e111b49SBarry Smith     ierr  =  PetscMemcpy(space,(*head)->array_head,((*head)->local_used)*sizeof(PetscInt));CHKERRQ(ierr);
4270f19b1fSKris Buschelman     space += (*head)->local_used;
4370f19b1fSKris Buschelman     ierr  =  PetscFree((*head)->array_head);CHKERRQ(ierr);
4470f19b1fSKris Buschelman     ierr  =  PetscFree(*head);CHKERRQ(ierr);
4570f19b1fSKris Buschelman     *head =  a;
4670f19b1fSKris Buschelman   }
4770f19b1fSKris Buschelman   PetscFunctionReturn(0);
4870f19b1fSKris Buschelman }
497a48dd6fSHong Zhang 
5030cb48eeSHong Zhang /*
51783ef271SHong Zhang   PetscFreeSpaceContiguous_LU -
52783ef271SHong Zhang     Copy a linket list obtained from matrix symbolic ILU or LU factorization into a contiguous array
53783ef271SHong Zhang   that enables an efficient matrix triangular solve.
5430cb48eeSHong Zhang 
5530cb48eeSHong Zhang    Input Parameters:
56783ef271SHong Zhang +  head - linked list of column indices obtained from matrix symbolic ILU or LU factorization
57783ef271SHong Zhang .  space - an allocated int array with length nnz of factored matrix.
5830cb48eeSHong Zhang .  n - order of the matrix
592ce24eb6SHong Zhang .  bi - row pointer of factored matrix L with length n+1.
602ce24eb6SHong Zhang -  bdiag - int array of length n+1. bdiag[i] points to diagonal of U(i,:), and bdiag[n] points to entry of U(n-1,0)-1.
6130cb48eeSHong Zhang 
6230cb48eeSHong Zhang    Output Parameter:
6330cb48eeSHong Zhang .  space - column indices are copied into this int array with contiguous layout of L and U
64783ef271SHong Zhang 
652ce24eb6SHong Zhang    See MatILUFactorSymbolic_SeqAIJ_ilu0() for detailed data structure of L and U
6630cb48eeSHong Zhang */
677a48dd6fSHong Zhang #undef __FUNCT__
68783ef271SHong Zhang #define __FUNCT__ "PetscFreeSpaceContiguous_LU"
69783ef271SHong Zhang PetscErrorCode PetscFreeSpaceContiguous_LU(PetscFreeSpaceList *head,PetscInt *space,PetscInt n,PetscInt *bi,PetscInt *bdiag)
7012b5cbf3SHong Zhang {
7112b5cbf3SHong Zhang   PetscFreeSpaceList a;
7212b5cbf3SHong Zhang   PetscErrorCode     ierr;
73f268cba8SShri Abhyankar   PetscInt           row,nnz,*bj,*array,total,bi_temp;
74f268cba8SShri Abhyankar   PetscInt           nnzL,nnzU;
75f268cba8SShri Abhyankar 
76f268cba8SShri Abhyankar   PetscFunctionBegin;
77f268cba8SShri Abhyankar   bi_temp = bi[n];
78f268cba8SShri Abhyankar   row       = 0;
79f268cba8SShri Abhyankar   total     = 0;
80f268cba8SShri Abhyankar   nnzL  = bdiag[0];
81f268cba8SShri Abhyankar   while ((*head)!=NULL) {
82f268cba8SShri Abhyankar     total += (*head)->local_used;
83f268cba8SShri Abhyankar     array  = (*head)->array_head;
84f268cba8SShri Abhyankar 
85*0e97c5f4SHong Zhang     while (row < n) {
86*0e97c5f4SHong Zhang       if (bi[row+1] > total) break;
87f268cba8SShri Abhyankar       /* copy array entries into bj for this row */
88f268cba8SShri Abhyankar       nnz  = bi[row+1] - bi[row];
89f268cba8SShri Abhyankar       /* set bi[row] for new datastruct */
90f268cba8SShri Abhyankar       if (row == 0 ){
91f268cba8SShri Abhyankar         bi[row] = 0;
92f268cba8SShri Abhyankar       } else {
93f268cba8SShri Abhyankar         bi[row] = bi[row-1] + nnzL; /* nnzL of previous row */
94f268cba8SShri Abhyankar       }
95f268cba8SShri Abhyankar 
96f268cba8SShri Abhyankar       /* L part */
97f268cba8SShri Abhyankar       nnzL = bdiag[row];
98f268cba8SShri Abhyankar       bj   = space+bi[row];
99f268cba8SShri Abhyankar       ierr = PetscMemcpy(bj,array,nnzL*sizeof(PetscInt));CHKERRQ(ierr);
100f268cba8SShri Abhyankar 
101f268cba8SShri Abhyankar       /* diagonal entry */
102f268cba8SShri Abhyankar       bdiag[row] = bi_temp - 1;
103f268cba8SShri Abhyankar       space[bdiag[row]] = row;
104f268cba8SShri Abhyankar 
105f268cba8SShri Abhyankar       /* U part */
106f268cba8SShri Abhyankar       nnzU        = nnz - nnzL;
107f268cba8SShri Abhyankar       bi_temp = bi_temp - nnzU;
108f268cba8SShri Abhyankar       nnzU --;      /* exclude diagonal */
109f268cba8SShri Abhyankar       bj = space + bi_temp;
110f268cba8SShri Abhyankar       ierr = PetscMemcpy(bj,array+nnzL+1,nnzU*sizeof(PetscInt));CHKERRQ(ierr);
111f268cba8SShri Abhyankar       array += nnz;
112f268cba8SShri Abhyankar       row++;
113f268cba8SShri Abhyankar     }
114f268cba8SShri Abhyankar 
115f268cba8SShri Abhyankar     a     = (*head)->more_space;
116f268cba8SShri Abhyankar     ierr  = PetscFree((*head)->array_head);CHKERRQ(ierr);
117f268cba8SShri Abhyankar     ierr  = PetscFree(*head);CHKERRQ(ierr);
118f268cba8SShri Abhyankar     *head = a;
119f268cba8SShri Abhyankar   }
120f268cba8SShri Abhyankar   bi[n] = bi[n-1] + nnzL;
121f268cba8SShri Abhyankar   bdiag[n] = bdiag[n-1]-1;
122f268cba8SShri Abhyankar   PetscFunctionReturn(0);
123f268cba8SShri Abhyankar }
124f268cba8SShri Abhyankar 
125783ef271SHong Zhang /*
126783ef271SHong Zhang   PetscFreeSpaceContiguous_Cholesky -
127783ef271SHong Zhang     Copy a linket list obtained from matrix symbolic ICC or Cholesky factorization into a contiguous array
128783ef271SHong Zhang   that enables an efficient matrix triangular solve.
129783ef271SHong Zhang 
130783ef271SHong Zhang    Input Parameters:
131783ef271SHong Zhang +  head - linked list of column indices obtained from matrix symbolic ICC or Cholesky factorization
132783ef271SHong Zhang .  space - an allocated int array with length nnz of factored matrix.
133783ef271SHong Zhang .  n - order of the matrix
134783ef271SHong Zhang .  ui - row pointer of factored matrix with length n+1. All entries are set based on the traditional layout U matrix.
135783ef271SHong Zhang -  udiag - int array of length n.
136783ef271SHong Zhang 
137783ef271SHong Zhang    Output Parameter:
138783ef271SHong Zhang +  space - column indices are copied into this int array with contiguous layout of U, with diagonal located as the last entry in each row
139783ef271SHong Zhang -  udiag - indices of diagonal entries
140783ef271SHong Zhang 
141783ef271SHong Zhang    See MatICCFactorSymbolic_SeqAIJ_newdatastruct() for detailed description.
142783ef271SHong Zhang */
143783ef271SHong Zhang 
144783ef271SHong Zhang #undef __FUNCT__
145783ef271SHong Zhang #define __FUNCT__ "PetscFreeSpaceContiguous_Cholesky"
146783ef271SHong Zhang PetscErrorCode PetscFreeSpaceContiguous_Cholesky(PetscFreeSpaceList *head,PetscInt *space,PetscInt n,PetscInt *ui,PetscInt *udiag)
147783ef271SHong Zhang {
148783ef271SHong Zhang   PetscFreeSpaceList a;
149783ef271SHong Zhang   PetscErrorCode     ierr;
150783ef271SHong Zhang   PetscInt           row,nnz,*uj,*array,total;
151783ef271SHong Zhang 
152783ef271SHong Zhang   PetscFunctionBegin;
153783ef271SHong Zhang   row   = 0;
154783ef271SHong Zhang   total = 0;
155*0e97c5f4SHong Zhang   while (*head) {
156783ef271SHong Zhang     total += (*head)->local_used;
157783ef271SHong Zhang     array  = (*head)->array_head;
158783ef271SHong Zhang 
159*0e97c5f4SHong Zhang     while (row < n){
160*0e97c5f4SHong Zhang       if (ui[row+1] > total) break;
161783ef271SHong Zhang       udiag[row] = ui[row+1] - 1;     /* points to the last entry of U(row,:) */
162783ef271SHong Zhang       nnz  = ui[row+1] - ui[row] - 1; /* exclude diagonal */
163783ef271SHong Zhang       uj   = space + ui[row];
164783ef271SHong Zhang       ierr = PetscMemcpy(uj,array+1,nnz*sizeof(PetscInt));CHKERRQ(ierr);
165783ef271SHong Zhang       uj[nnz] = array[0]; /* diagonal */
166783ef271SHong Zhang       array += nnz + 1;
167783ef271SHong Zhang       row++;
168783ef271SHong Zhang     }
169783ef271SHong Zhang 
170783ef271SHong Zhang     a     = (*head)->more_space;
171783ef271SHong Zhang     ierr  = PetscFree((*head)->array_head);CHKERRQ(ierr);
172783ef271SHong Zhang     ierr  = PetscFree(*head);CHKERRQ(ierr);
173783ef271SHong Zhang     *head = a;
174783ef271SHong Zhang   }
175783ef271SHong Zhang   PetscFunctionReturn(0);
176783ef271SHong Zhang }
177783ef271SHong Zhang 
17812b5cbf3SHong Zhang #undef __FUNCT__
179a1a86e44SBarry Smith #define __FUNCT__ "PetscFreeSpaceDestroy"
180a1a86e44SBarry Smith PetscErrorCode PetscFreeSpaceDestroy(PetscFreeSpaceList head)
1817a48dd6fSHong Zhang {
182a1a86e44SBarry Smith   PetscFreeSpaceList a;
1837a48dd6fSHong Zhang   PetscErrorCode     ierr;
1847a48dd6fSHong Zhang 
1857a48dd6fSHong Zhang   PetscFunctionBegin;
1867a48dd6fSHong Zhang   while ((head)!=NULL) {
1877a48dd6fSHong Zhang     a    = (head)->more_space;
1887a48dd6fSHong Zhang     ierr = PetscFree((head)->array_head);CHKERRQ(ierr);
1897a48dd6fSHong Zhang     ierr = PetscFree(head);CHKERRQ(ierr);
1907a48dd6fSHong Zhang     head = a;
1917a48dd6fSHong Zhang   }
1927a48dd6fSHong Zhang   PetscFunctionReturn(0);
1937a48dd6fSHong Zhang }
194