xref: /petsc/src/mat/utils/freespace.c (revision 8865f1ea4ea560cd84ab8db62e98b7095cdff96f)
1be1d678aSKris Buschelman 
2c6db04a5SJed Brown #include <../src/mat/utils/freespace.h>
370f19b1fSKris Buschelman 
470f19b1fSKris Buschelman #undef __FUNCT__
5a1a86e44SBarry Smith #define __FUNCT__ "PetscFreeSpaceGet"
6a1a86e44SBarry Smith PetscErrorCode PetscFreeSpaceGet(PetscInt n,PetscFreeSpaceList *list)
72e111b49SBarry Smith {
8a1a86e44SBarry Smith   PetscFreeSpaceList a;
9dfbe8321SBarry Smith   PetscErrorCode     ierr;
1070f19b1fSKris Buschelman 
1170f19b1fSKris Buschelman   PetscFunctionBegin;
12a1a86e44SBarry Smith   ierr = PetscMalloc(sizeof(struct _Space),&a);CHKERRQ(ierr);
132e111b49SBarry Smith   ierr = PetscMalloc(n*sizeof(PetscInt),&(a->array_head));CHKERRQ(ierr);
14*8865f1eaSKarl Rupp 
1570f19b1fSKris Buschelman   a->array            = a->array_head;
162e111b49SBarry Smith   a->local_remaining  = n;
1770f19b1fSKris Buschelman   a->local_used       = 0;
1870f19b1fSKris Buschelman   a->total_array_size = 0;
19c722e25dSBarry Smith   a->more_space       = PETSC_NULL;
2070f19b1fSKris Buschelman 
2170f19b1fSKris Buschelman   if (*list) {
2270f19b1fSKris Buschelman     (*list)->more_space = a;
2370f19b1fSKris Buschelman     a->total_array_size = (*list)->total_array_size;
2470f19b1fSKris Buschelman   }
2570f19b1fSKris Buschelman 
262e111b49SBarry Smith   a->total_array_size += n;
2770f19b1fSKris Buschelman   *list                =  a;
2870f19b1fSKris Buschelman   PetscFunctionReturn(0);
2970f19b1fSKris Buschelman }
3070f19b1fSKris Buschelman 
3170f19b1fSKris Buschelman #undef __FUNCT__
32a1a86e44SBarry Smith #define __FUNCT__ "PetscFreeSpaceContiguous"
33a1a86e44SBarry Smith PetscErrorCode PetscFreeSpaceContiguous(PetscFreeSpaceList *head,PetscInt *space)
3438baddfdSBarry Smith {
35a1a86e44SBarry Smith   PetscFreeSpaceList a;
36dfbe8321SBarry Smith   PetscErrorCode     ierr;
3770f19b1fSKris Buschelman 
3870f19b1fSKris Buschelman   PetscFunctionBegin;
39c05d87d6SBarry Smith   while ((*head)) {
4070f19b1fSKris Buschelman     a      =  (*head)->more_space;
412e111b49SBarry Smith     ierr   =  PetscMemcpy(space,(*head)->array_head,((*head)->local_used)*sizeof(PetscInt));CHKERRQ(ierr);
4270f19b1fSKris Buschelman     space += (*head)->local_used;
4370f19b1fSKris Buschelman     ierr   =  PetscFree((*head)->array_head);CHKERRQ(ierr);
4470f19b1fSKris Buschelman     ierr   =  PetscFree(*head);CHKERRQ(ierr);
4570f19b1fSKris Buschelman     *head  =  a;
4670f19b1fSKris Buschelman   }
4770f19b1fSKris Buschelman   PetscFunctionReturn(0);
4870f19b1fSKris Buschelman }
497a48dd6fSHong Zhang 
5030cb48eeSHong Zhang /*
51783ef271SHong Zhang   PetscFreeSpaceContiguous_LU -
52783ef271SHong Zhang     Copy a linket list obtained from matrix symbolic ILU or LU factorization into a contiguous array
53783ef271SHong Zhang   that enables an efficient matrix triangular solve.
5430cb48eeSHong Zhang 
5530cb48eeSHong Zhang    Input Parameters:
56783ef271SHong Zhang +  head - linked list of column indices obtained from matrix symbolic ILU or LU factorization
57783ef271SHong Zhang .  space - an allocated int array with length nnz of factored matrix.
5830cb48eeSHong Zhang .  n - order of the matrix
592ce24eb6SHong Zhang .  bi - row pointer of factored matrix L with length n+1.
602ce24eb6SHong Zhang -  bdiag - int array of length n+1. bdiag[i] points to diagonal of U(i,:), and bdiag[n] points to entry of U(n-1,0)-1.
6130cb48eeSHong Zhang 
6230cb48eeSHong Zhang    Output Parameter:
6330cb48eeSHong Zhang .  space - column indices are copied into this int array with contiguous layout of L and U
64783ef271SHong Zhang 
652ce24eb6SHong Zhang    See MatILUFactorSymbolic_SeqAIJ_ilu0() for detailed data structure of L and U
6630cb48eeSHong Zhang */
677a48dd6fSHong Zhang #undef __FUNCT__
68783ef271SHong Zhang #define __FUNCT__ "PetscFreeSpaceContiguous_LU"
69783ef271SHong Zhang PetscErrorCode PetscFreeSpaceContiguous_LU(PetscFreeSpaceList *head,PetscInt *space,PetscInt n,PetscInt *bi,PetscInt *bdiag)
7012b5cbf3SHong Zhang {
7112b5cbf3SHong Zhang   PetscFreeSpaceList a;
7212b5cbf3SHong Zhang   PetscErrorCode     ierr;
73f268cba8SShri Abhyankar   PetscInt           row,nnz,*bj,*array,total,bi_temp;
74f268cba8SShri Abhyankar   PetscInt           nnzL,nnzU;
75f268cba8SShri Abhyankar 
76f268cba8SShri Abhyankar   PetscFunctionBegin;
77f268cba8SShri Abhyankar   bi_temp = bi[n];
78f268cba8SShri Abhyankar   row     = 0;
79f268cba8SShri Abhyankar   total   = 0;
80f268cba8SShri Abhyankar   nnzL    = bdiag[0];
81c722e25dSBarry Smith   while ((*head)) {
82f268cba8SShri Abhyankar     total += (*head)->local_used;
83f268cba8SShri Abhyankar     array  = (*head)->array_head;
84f268cba8SShri Abhyankar 
850e97c5f4SHong Zhang     while (row < n) {
860e97c5f4SHong Zhang       if (bi[row+1] > total) break;
87f268cba8SShri Abhyankar       /* copy array entries into bj for this row */
88f268cba8SShri Abhyankar       nnz = bi[row+1] - bi[row];
89f268cba8SShri Abhyankar       /* set bi[row] for new datastruct */
90f268cba8SShri Abhyankar       if (row == 0) {
91f268cba8SShri Abhyankar         bi[row] = 0;
92f268cba8SShri Abhyankar       } else {
93f268cba8SShri Abhyankar         bi[row] = bi[row-1] + nnzL; /* nnzL of previous row */
94f268cba8SShri Abhyankar       }
95f268cba8SShri Abhyankar 
96f268cba8SShri Abhyankar       /* L part */
97f268cba8SShri Abhyankar       nnzL = bdiag[row];
98f268cba8SShri Abhyankar       bj   = space+bi[row];
99f268cba8SShri Abhyankar       ierr = PetscMemcpy(bj,array,nnzL*sizeof(PetscInt));CHKERRQ(ierr);
100f268cba8SShri Abhyankar 
101f268cba8SShri Abhyankar       /* diagonal entry */
102f268cba8SShri Abhyankar       bdiag[row]        = bi_temp - 1;
103f268cba8SShri Abhyankar       space[bdiag[row]] = row;
104f268cba8SShri Abhyankar 
105f268cba8SShri Abhyankar       /* U part */
106f268cba8SShri Abhyankar       nnzU    = nnz - nnzL;
107f268cba8SShri Abhyankar       bi_temp = bi_temp - nnzU;
108f268cba8SShri Abhyankar       nnzU--;       /* exclude diagonal */
109f268cba8SShri Abhyankar       bj     = space + bi_temp;
110f268cba8SShri Abhyankar       ierr   = PetscMemcpy(bj,array+nnzL+1,nnzU*sizeof(PetscInt));CHKERRQ(ierr);
111f268cba8SShri Abhyankar       array += nnz;
112f268cba8SShri Abhyankar       row++;
113f268cba8SShri Abhyankar     }
114f268cba8SShri Abhyankar 
115f268cba8SShri Abhyankar     a     = (*head)->more_space;
116f268cba8SShri Abhyankar     ierr  = PetscFree((*head)->array_head);CHKERRQ(ierr);
117f268cba8SShri Abhyankar     ierr  = PetscFree(*head);CHKERRQ(ierr);
118f268cba8SShri Abhyankar     *head = a;
119f268cba8SShri Abhyankar   }
12043c97eaeSBarry Smith   if (n) {
121f268cba8SShri Abhyankar     bi[n]    = bi[n-1] + nnzL;
122f268cba8SShri Abhyankar     bdiag[n] = bdiag[n-1]-1;
12343c97eaeSBarry Smith   }
124f268cba8SShri Abhyankar   PetscFunctionReturn(0);
125f268cba8SShri Abhyankar }
126f268cba8SShri Abhyankar 
127783ef271SHong Zhang /*
128783ef271SHong Zhang   PetscFreeSpaceContiguous_Cholesky -
129783ef271SHong Zhang     Copy a linket list obtained from matrix symbolic ICC or Cholesky factorization into a contiguous array
130783ef271SHong Zhang   that enables an efficient matrix triangular solve.
131783ef271SHong Zhang 
132783ef271SHong Zhang    Input Parameters:
133783ef271SHong Zhang +  head - linked list of column indices obtained from matrix symbolic ICC or Cholesky factorization
134783ef271SHong Zhang .  space - an allocated int array with length nnz of factored matrix.
135783ef271SHong Zhang .  n - order of the matrix
136783ef271SHong Zhang .  ui - row pointer of factored matrix with length n+1. All entries are set based on the traditional layout U matrix.
137783ef271SHong Zhang -  udiag - int array of length n.
138783ef271SHong Zhang 
139783ef271SHong Zhang    Output Parameter:
140783ef271SHong Zhang +  space - column indices are copied into this int array with contiguous layout of U, with diagonal located as the last entry in each row
141783ef271SHong Zhang -  udiag - indices of diagonal entries
142783ef271SHong Zhang 
143783ef271SHong Zhang    See MatICCFactorSymbolic_SeqAIJ_newdatastruct() for detailed description.
144783ef271SHong Zhang */
145783ef271SHong Zhang 
146783ef271SHong Zhang #undef __FUNCT__
147783ef271SHong Zhang #define __FUNCT__ "PetscFreeSpaceContiguous_Cholesky"
148783ef271SHong Zhang PetscErrorCode PetscFreeSpaceContiguous_Cholesky(PetscFreeSpaceList *head,PetscInt *space,PetscInt n,PetscInt *ui,PetscInt *udiag)
149783ef271SHong Zhang {
150783ef271SHong Zhang   PetscFreeSpaceList a;
151783ef271SHong Zhang   PetscErrorCode     ierr;
152783ef271SHong Zhang   PetscInt           row,nnz,*uj,*array,total;
153783ef271SHong Zhang 
154783ef271SHong Zhang   PetscFunctionBegin;
155783ef271SHong Zhang   row   = 0;
156783ef271SHong Zhang   total = 0;
1570e97c5f4SHong Zhang   while (*head) {
158783ef271SHong Zhang     total += (*head)->local_used;
159783ef271SHong Zhang     array  = (*head)->array_head;
160783ef271SHong Zhang 
1610e97c5f4SHong Zhang     while (row < n) {
1620e97c5f4SHong Zhang       if (ui[row+1] > total) break;
163783ef271SHong Zhang       udiag[row] = ui[row+1] - 1;     /* points to the last entry of U(row,:) */
164783ef271SHong Zhang       nnz        = ui[row+1] - ui[row] - 1; /* exclude diagonal */
165783ef271SHong Zhang       uj         = space + ui[row];
166783ef271SHong Zhang       ierr       = PetscMemcpy(uj,array+1,nnz*sizeof(PetscInt));CHKERRQ(ierr);
167783ef271SHong Zhang       uj[nnz]    = array[0]; /* diagonal */
168783ef271SHong Zhang       array     += nnz + 1;
169783ef271SHong Zhang       row++;
170783ef271SHong Zhang     }
171783ef271SHong Zhang 
172783ef271SHong Zhang     a     = (*head)->more_space;
173783ef271SHong Zhang     ierr  = PetscFree((*head)->array_head);CHKERRQ(ierr);
174783ef271SHong Zhang     ierr  = PetscFree(*head);CHKERRQ(ierr);
175783ef271SHong Zhang     *head = a;
176783ef271SHong Zhang   }
177783ef271SHong Zhang   PetscFunctionReturn(0);
178783ef271SHong Zhang }
179783ef271SHong Zhang 
18012b5cbf3SHong Zhang #undef __FUNCT__
181a1a86e44SBarry Smith #define __FUNCT__ "PetscFreeSpaceDestroy"
182a1a86e44SBarry Smith PetscErrorCode PetscFreeSpaceDestroy(PetscFreeSpaceList head)
1837a48dd6fSHong Zhang {
184a1a86e44SBarry Smith   PetscFreeSpaceList a;
1857a48dd6fSHong Zhang   PetscErrorCode     ierr;
1867a48dd6fSHong Zhang 
1877a48dd6fSHong Zhang   PetscFunctionBegin;
188c722e25dSBarry Smith   while ((head)) {
1897a48dd6fSHong Zhang     a    = (head)->more_space;
1907a48dd6fSHong Zhang     ierr = PetscFree((head)->array_head);CHKERRQ(ierr);
1917a48dd6fSHong Zhang     ierr = PetscFree(head);CHKERRQ(ierr);
1927a48dd6fSHong Zhang     head = a;
1937a48dd6fSHong Zhang   }
1947a48dd6fSHong Zhang   PetscFunctionReturn(0);
1957a48dd6fSHong Zhang }
196