Subversion Repositories slepc-dev

Rev

Go to most recent revision | Details | Compare with Previous | Last modification | View Log | RSS feed

Rev Author Line No. Line
/*
   SLEPc singular value solver: "trlanczos"

   Method: Golub-Kahan-Lanczos bidiagonalization with thick-restart

   Last update: Mar 2007

   - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
      SLEPc - Scalable Library for Eigenvalue Problem Computations
      Copyright (c) 2002-2007, Universidad Politecnica de Valencia, Spain

      This file is part of SLEPc. See the README file for conditions of use
      and additional information.
   - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
*/
1376 slepc 17
 
1298 slepc 18
#include "src/svd/svdimpl.h"                /*I "slepcsvd.h" I*/
19
#include "slepcblaslapack.h"
20
 
21
/* Solver-private data for the "trlanczos" SVD solver; stored in svd->data. */
typedef struct {
22
  PetscTruth oneside;   /* selects the one-side (true) or two-side (false) Lanczos variant in the solve routine */
23
} SVD_TRLANCZOS;
24
 
25
#undef __FUNCT__  
26
#define __FUNCT__ "SVDSetUp_TRLANCZOS"
27
/*
   SVDSetUp_TRLANCZOS - Fills in defaults for ncv and max_it and (re)creates
   the array of left vectors svd->U.

   ncv and max_it are only touched when they are still PETSC_DECIDE. The U
   array is rebuilt only when the requested ncv differs from svd->n, the
   number of vectors currently accounted for in svd->U.
*/
PetscErrorCode SVDSetUp_TRLANCZOS(SVD svd)
{
  PetscErrorCode ierr;
  PetscInt       ncols;
  int            idx;

  PetscFunctionBegin;
  ierr = SVDMatGetSize(svd,PETSC_NULL,&ncols);CHKERRQ(ierr);

  /* default basis size: at least 10, twice nsv if larger, never above the matrix dimension */
  if (svd->ncv == PETSC_DECIDE) {
    svd->ncv = PetscMin(ncols,PetscMax(2*svd->nsv,10));
  }
  /* default iteration limit: at least 100 */
  if (svd->max_it == PETSC_DECIDE) {
    svd->max_it = PetscMax(ncols/svd->ncv,100);
  }

  /* nothing to rebuild when the basis size is unchanged */
  if (svd->ncv == svd->n) PetscFunctionReturn(0);

  /* drop the previous set of left vectors, if any */
  if (svd->U) {
    for (idx = 0; idx < svd->n; idx++) {
      ierr = VecDestroy(svd->U[idx]);CHKERRQ(ierr);
    }
    ierr = PetscFree(svd->U);CHKERRQ(ierr);
  }

  /* create ncv fresh left vectors */
  ierr = PetscMalloc(sizeof(Vec)*svd->ncv,&svd->U);CHKERRQ(ierr);
  for (idx = 0; idx < svd->ncv; idx++) {
    ierr = SVDMatGetVecs(svd,PETSC_NULL,&svd->U[idx]);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}
49
 
50
#undef __FUNCT__  
1328 slepc 51
#define __FUNCT__ "SVDOneSideTRLanczos"
52
/*
   SVDOneSideTRLanczos - Extends the Lanczos bidiagonalization from column
   nconv+l up to column n-1 using the one-side variant: only the V vectors are
   orthogonalized explicitly; each U vector is just normalized.

   Input/output:
     alpha, beta - receive the computed coefficients; entry (i-(nconv+l)-1)
                   holds the values produced at step i
     bb          - l coefficients used to correct the first new U vector
     V, U        - right and left bases (entries from nconv+l onwards are written)
     v           - receives the (unnormalized) next right vector
     work        - scalar workspace with at least n entries
     wv, wu      - work vectors (wv is handed to IPOrthogonalizeCGS, wu holds
                   the restart correction)
*/
static PetscErrorCode SVDOneSideTRLanczos(SVD svd,PetscReal *alpha,PetscReal *beta,PetscScalar *bb,Vec *V,Vec v,Vec *U,int nconv,int l,int n,PetscScalar *work,Vec wv,Vec wu)
{
  PetscErrorCode ierr;
  PetscReal      unorm,vnorm;
  int            first = nconv+l;
  int            col,t;

  PetscFunctionBegin;
  /* first new left vector: U[first] = A*V[first] - sum_j bb[j]*U[nconv+j] */
  ierr = SVDMatMult(svd,PETSC_FALSE,V[first],U[first]);CHKERRQ(ierr);
  if (l>0) {
    ierr = VecSet(wu,0.0);CHKERRQ(ierr);
    ierr = VecMAXPY(wu,l,bb,U+nconv);CHKERRQ(ierr);
    ierr = VecAXPY(U[first],-1.0,wu);CHKERRQ(ierr);
  }

  for (col = first+1; col < n; col++) {
    Vec uprev = U[col-1];
    Vec vcur  = V[col];

    /* vcur = A'*uprev, computed before uprev is normalized */
    ierr = SVDMatMult(svd,PETSC_TRUE,uprev,vcur);CHKERRQ(ierr);

    /* norm of uprev and inner products of vcur against V[0..col-1], issued as split-phase Begin/End pairs */
    ierr = IPNormBegin(svd->ip,uprev,&unorm);CHKERRQ(ierr);
    ierr = IPMInnerProductBegin(svd->ip,col,vcur,V,work);CHKERRQ(ierr);
    ierr = IPNormEnd(svd->ip,uprev,&unorm);CHKERRQ(ierr);
    ierr = IPMInnerProductEnd(svd->ip,col,vcur,V,work);CHKERRQ(ierr);

    /* normalize uprev; rescale vcur and the coefficients to match, then subtract the projections */
    ierr = VecScale(uprev,1.0/unorm);CHKERRQ(ierr);
    ierr = VecScale(vcur,1.0/unorm);CHKERRQ(ierr);
    for (t = 0; t < col; t++) {
      work[t] = - work[t] / unorm;
    }
    ierr = VecMAXPY(vcur,col,work,V);CHKERRQ(ierr);

    /* further orthogonalization pass against V[0..col-1]; vnorm receives the resulting norm */
    ierr = IPOrthogonalizeCGS(svd->ip,col,PETSC_NULL,V,vcur,work,PETSC_NULL,&vnorm,wv);CHKERRQ(ierr);
    ierr = VecScale(vcur,1.0/vnorm);CHKERRQ(ierr);

    /* next left vector: U[col] = A*vcur - vnorm*uprev */
    ierr = SVDMatMult(svd,PETSC_FALSE,vcur,U[col]);CHKERRQ(ierr);
    ierr = VecAXPY(U[col],-vnorm,uprev);CHKERRQ(ierr);

    alpha[col-first-1] = unorm;
    beta[col-first-1]  = vnorm;
  }

  /* last step: same as above, but the new right vector goes to v and is left unnormalized */
  ierr = SVDMatMult(svd,PETSC_TRUE,U[n-1],v);CHKERRQ(ierr);
  ierr = IPNormBegin(svd->ip,U[n-1],&unorm);CHKERRQ(ierr);
  ierr = IPMInnerProductBegin(svd->ip,n,v,V,work);CHKERRQ(ierr);
  ierr = IPNormEnd(svd->ip,U[n-1],&unorm);CHKERRQ(ierr);
  ierr = IPMInnerProductEnd(svd->ip,n,v,V,work);CHKERRQ(ierr);

  ierr = VecScale(U[n-1],1.0/unorm);CHKERRQ(ierr);
  ierr = VecScale(v,1.0/unorm);CHKERRQ(ierr);
  for (t = 0; t < n; t++) {
    work[t] = - work[t] / unorm;
  }
  ierr = VecMAXPY(v,n,work,V);CHKERRQ(ierr);

  ierr = IPOrthogonalizeCGS(svd->ip,n,PETSC_NULL,V,v,work,PETSC_NULL,&vnorm,wv);CHKERRQ(ierr);

  alpha[n-first-1] = unorm;
  beta[n-first-1]  = vnorm;
  PetscFunctionReturn(0);
}
103
 
104
#undef __FUNCT__  
1298 slepc 105
#define __FUNCT__ "SVDSolve_TRLANCZOS"
106
/*
   SVDSolve_TRLANCZOS - Main loop of the thick-restart Lanczos SVD solver.

   Each outer iteration
     1. extends the bidiagonalization (one-side or two-side variant),
     2. builds the small projected matrix and computes its dense SVD,
     3. derives error estimates and counts the leading converged values,
     4. forms the converged and restart vectors and stores them back in
        svd->V / svd->U.
   After the loop the converged triplets are reordered by singular value.
*/
PetscErrorCode SVDSolve_TRLANCZOS(SVD svd)
{
  PetscErrorCode ierr;
  SVD_TRLANCZOS  *ctx = (SVD_TRLANCZOS *)svd->data;
  PetscReal      *alpha,*beta,norm;
  PetscScalar    *b,*Q,*PT,*swork;
  PetscInt       *perm;
  int            t,r,c,src,nlock,nkeep,nact,nwork=0;
  Vec            v,wv,wu,*workV,*workU,*permV,*permU;
  PetscTruth     leading;

  PetscFunctionBegin;
  /* scratch storage, all dimensioned by the basis size svd->n */
  ierr = PetscMalloc(sizeof(PetscReal)*svd->n,&alpha);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(PetscReal)*svd->n,&beta);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(PetscScalar)*svd->n,&b);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(PetscScalar)*svd->n*svd->n,&Q);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(PetscScalar)*svd->n*svd->n,&PT);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(PetscScalar)*svd->n,&swork);CHKERRQ(ierr);
  ierr = VecDuplicate(svd->V[0],&v);CHKERRQ(ierr);
  ierr = VecDuplicate(svd->V[0],&wv);CHKERRQ(ierr);
  ierr = VecDuplicate(svd->U[0],&wu);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(Vec)*svd->n,&workV);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(Vec)*svd->n,&workU);CHKERRQ(ierr);

  /* the normalized initial vector becomes the first right vector */
  ierr = VecCopy(svd->vec_initial,svd->V[0]);CHKERRQ(ierr);
  ierr = VecNormalize(svd->V[0],&norm);CHKERRQ(ierr);

  nkeep = 0;   /* number of restart vectors kept from the previous iteration */
  while (svd->reason == SVD_CONVERGED_ITERATING) {
    svd->its++;

    /* extend the bidiagonalization up to svd->n columns */
    if (ctx->oneside) {
      ierr = SVDOneSideTRLanczos(svd,alpha,beta,b+svd->nconv,svd->V,v,svd->U,svd->nconv,nkeep,svd->n,swork,wv,wu);CHKERRQ(ierr);
    } else {
      ierr = SVDTwoSideLanczos(svd,alpha,beta,svd->V,v,svd->U,svd->nconv+nkeep,svd->n,swork,wv,wu);CHKERRQ(ierr);
    }
    /* scale the residual vector by the last beta */
    ierr = VecScale(v,1.0/beta[svd->n-svd->nconv-nkeep-1]);CHKERRQ(ierr);

    /* assemble the nact x nact projected matrix; entry (row,col) is stored at Q[col*nact+row] */
    nact = svd->n - svd->nconv;
    for (t = 0; t < nact*nact; t++) Q[t] = 0.0;
    for (c = 0; c < nkeep; c++) {
      Q[c*nact+c]     = svd->sigma[svd->nconv+c];   /* diagonal of the first nkeep columns */
      Q[nkeep*nact+c] = b[c+svd->nconv];            /* top of column nkeep */
    }
    Q[nkeep*nact+nkeep] = alpha[0];
    for (c = nkeep+1; c < nact; c++) {
      Q[c*nact+c-1] = beta[c-nkeep-1];
      Q[c*nact+c]   = alpha[c-nkeep];
    }
    /* dense SVD: values returned in alpha, factors returned in Q and PT */
    ierr = SVDDense(nact,nact,Q,alpha,PETSC_NULL,PT);CHKERRQ(ierr);

    /* error estimates; nlock counts the leading run of values whose estimate is below tol */
    nlock   = 0;
    leading = PETSC_TRUE;
    for (t = 0; t < nact; t++) {
      r   = svd->nconv + t;
      src = (svd->which == SVD_SMALLEST) ? nact-t-1 : t;
      svd->sigma[r]  = alpha[src];
      b[r]           = Q[src*nact+nact-1]*beta[nact-nkeep-1];
      svd->errest[r] = PetscAbsScalar(b[r]);
      /* use a relative estimate unless the value itself is not larger than tol */
      if (alpha[src] > svd->tol) svd->errest[r] /= alpha[src];
      if (leading && svd->errest[r] < svd->tol) nlock++;
      else leading = PETSC_FALSE;
    }

    /* stopping tests, then the number of restart vectors for the next pass */
    if (svd->its >= svd->max_it) svd->reason = SVD_DIVERGED_ITS;
    if (svd->nconv+nlock >= svd->nsv) svd->reason = SVD_CONVERGED_TOL;
    if (svd->reason == SVD_CONVERGED_ITERATING) {
      nkeep = PetscMax((svd->n - svd->nconv - nlock) / 2,1);
    } else {
      nkeep = 0;
    }

    /* grow the pool of temporary vectors to hold nlock+nkeep pairs */
    for (; nwork < nlock+nkeep; nwork++) {
      ierr = SVDMatGetVecs(svd,workV+nwork,workU+nwork);CHKERRQ(ierr);
    }

    /* converged and restart vectors as combinations of the active basis vectors */
    for (t = 0; t < nlock+nkeep; t++) {
      src = (svd->which == SVD_SMALLEST) ? nact-t-1 : t;
      ierr = VecSet(workV[t],0.0);CHKERRQ(ierr);
      for (r = 0; r < nact; r++) swork[r] = PT[r*nact+src];
      ierr = VecMAXPY(workV[t],nact,swork,svd->V+svd->nconv);CHKERRQ(ierr);
      ierr = VecSet(workU[t],0.0);CHKERRQ(ierr);
      ierr = VecMAXPY(workU[t],nact,Q+src*nact,svd->U+svd->nconv);CHKERRQ(ierr);
    }

    /* the residual vector becomes the next starting vector */
    if (svd->reason == SVD_CONVERGED_ITERATING) {
      ierr = VecCopy(v,svd->V[svd->nconv+nlock+nkeep]);CHKERRQ(ierr);
    }

    /* move the new vectors from temporary space into the bases */
    for (t = 0; t < nlock+nkeep; t++) {
      ierr = VecCopy(workV[t],svd->V[t+svd->nconv]);CHKERRQ(ierr);
      ierr = VecCopy(workU[t],svd->U[t+svd->nconv]);CHKERRQ(ierr);
    }

    svd->nconv += nlock;
    SVDMonitor(svd,svd->its,svd->nconv,svd->sigma,svd->errest,svd->n);
  }

  /* reorder the converged triplets; alpha/beta are reused as copies of sigma/errest */
  ierr = PetscMalloc(sizeof(PetscInt)*svd->nconv,&perm);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(Vec)*svd->nconv,&permV);CHKERRQ(ierr);
  ierr = PetscMalloc(sizeof(Vec)*svd->nconv,&permU);CHKERRQ(ierr);
  for (t = 0; t < svd->nconv; t++) {
    alpha[t] = svd->sigma[t];
    beta[t]  = svd->errest[t];
    permV[t] = svd->V[t];
    permU[t] = svd->U[t];
    perm[t]  = t;
  }
  ierr = PetscSortRealWithPermutation(svd->nconv,svd->sigma,perm);CHKERRQ(ierr);
  for (t = 0; t < svd->nconv; t++) {
    /* walk the permutation forwards for SVD_SMALLEST, backwards otherwise */
    src = (svd->which == SVD_SMALLEST) ? perm[t] : perm[svd->nconv-t-1];
    svd->sigma[t]  = alpha[src];
    svd->errest[t] = beta[src];
    svd->V[t]      = permV[src];
    svd->U[t]      = permU[src];
  }

  /* release work vectors and scratch arrays */
  ierr = VecDestroy(v);CHKERRQ(ierr);
  ierr = VecDestroy(wv);CHKERRQ(ierr);
  ierr = VecDestroy(wu);CHKERRQ(ierr);
  for (t = 0; t < nwork; t++) { ierr = VecDestroy(workV[t]);CHKERRQ(ierr); }
  ierr = PetscFree(workV);CHKERRQ(ierr);
  for (t = 0; t < nwork; t++) { ierr = VecDestroy(workU[t]);CHKERRQ(ierr); }
  ierr = PetscFree(workU);CHKERRQ(ierr);

  ierr = PetscFree(alpha);CHKERRQ(ierr);
  ierr = PetscFree(beta);CHKERRQ(ierr);
  ierr = PetscFree(b);CHKERRQ(ierr);
  ierr = PetscFree(Q);CHKERRQ(ierr);
  ierr = PetscFree(PT);CHKERRQ(ierr);
  ierr = PetscFree(swork);CHKERRQ(ierr);
  ierr = PetscFree(perm);CHKERRQ(ierr);
  ierr = PetscFree(permV);CHKERRQ(ierr);
  ierr = PetscFree(permU);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
265
 
266
#undef __FUNCT__  
267
#define __FUNCT__ "SVDSetFromOptions_TRLANCZOS"
268
/*
   SVDSetFromOptions_TRLANCZOS - Reads the solver-specific options from the
   options database.

   Recognized option:
     -svd_trlanczos_oneside  - sets the oneside flag of the solver context

   The current value of the flag is passed as the option's default, so the
   help output reports the actual setting and a value previously chosen with
   SVDTRLanczosSetOneSide() is not replaced by a hard-coded PETSC_FALSE when
   the option is absent from the database.
*/
PetscErrorCode SVDSetFromOptions_TRLANCZOS(SVD svd)
{
  PetscErrorCode ierr;
  SVD_TRLANCZOS  *lanczos = (SVD_TRLANCZOS *)svd->data;

  PetscFunctionBegin;
  ierr = PetscOptionsBegin(svd->comm,svd->prefix,"TRLANCZOS Singular Value Solver Options","SVD");CHKERRQ(ierr);
  ierr = PetscOptionsTruth("-svd_trlanczos_oneside","Lanczos one-side reorthogonalization","SVDTRLanczosSetOneSide",lanczos->oneside,&lanczos->oneside,PETSC_NULL);CHKERRQ(ierr);
  ierr = PetscOptionsEnd();CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
1370 slepc 279
 
1298 slepc 280
EXTERN_C_BEGIN
281
#undef __FUNCT__  
1359 slepc 282
#define __FUNCT__ "SVDTRLanczosSetOneSide_TRLANCZOS"
283
/*
   SVDTRLanczosSetOneSide_TRLANCZOS - Solver-specific implementation of
   SVDTRLanczosSetOneSide(): stores the flag in the solver context.
*/
PetscErrorCode SVDTRLanczosSetOneSide_TRLANCZOS(SVD svd,PetscTruth oneside)
{
  PetscFunctionBegin;
  ((SVD_TRLANCZOS *)svd->data)->oneside = oneside;
  PetscFunctionReturn(0);
}
1370 slepc 291
EXTERN_C_END
1298 slepc 292
 
293
#undef __FUNCT__
1359 slepc 294
#define __FUNCT__ "SVDTRLanczosSetOneSide"
295
/*
   SVDTRLanczosSetOneSide - Sets the one-side flag of the solver.

   The call is forwarded to the function composed with the object under the
   name "SVDTRLanczosSetOneSide_C"; if no such function is attached, the call
   does nothing and returns success.
*/
PetscErrorCode SVDTRLanczosSetOneSide(SVD svd,PetscTruth oneside)
{
  PetscErrorCode ierr;
  PetscErrorCode (*setter)(SVD,PetscTruth);

  PetscFunctionBegin;
  PetscValidHeaderSpecific(svd,SVD_COOKIE,1);
  ierr = PetscObjectQueryFunction((PetscObject)svd,"SVDTRLanczosSetOneSide_C",(void (**)())&setter);CHKERRQ(ierr);
  /* no implementation attached: nothing to do */
  if (!setter) PetscFunctionReturn(0);
  ierr = (*setter)(svd,oneside);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
307
 
308
#undef __FUNCT__  
309
#define __FUNCT__ "SVDView_TRLANCZOS"
310
/*
   SVDView_TRLANCZOS - Prints the solver-specific setting (one-side or
   two-side reorthogonalization) to the given viewer.
*/
PetscErrorCode SVDView_TRLANCZOS(SVD svd,PetscViewer viewer)
{
  PetscErrorCode ierr;
  SVD_TRLANCZOS  *ctx = (SVD_TRLANCZOS *)svd->data;
  const char     *mode;

  PetscFunctionBegin;
  if (ctx->oneside) {
    mode = "one-side";
  } else {
    mode = "two-side";
  }
  ierr = PetscViewerASCIIPrintf(viewer,"Lanczos reorthogonalization: %s\n",mode);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
319
 
320
EXTERN_C_BEGIN
321
#undef __FUNCT__  
322
#define __FUNCT__ "SVDCreate_TRLANCZOS"
323
/*
   SVDCreate_TRLANCZOS - Constructor for the "trlanczos" solver.

   Allocates the solver context (oneside defaults to PETSC_FALSE), installs
   the setup/solve/setfromoptions/view operations and composes the
   implementation of SVDTRLanczosSetOneSide() with the object.
*/
PetscErrorCode SVDCreate_TRLANCZOS(SVD svd)
{
  PetscErrorCode ierr;
  SVD_TRLANCZOS  *ctx;

  PetscFunctionBegin;
  /* solver context with its default setting */
  ierr = PetscNew(SVD_TRLANCZOS,&ctx);CHKERRQ(ierr);
  PetscLogObjectMemory(svd,sizeof(SVD_TRLANCZOS));
  ctx->oneside = PETSC_FALSE;
  svd->data    = (void *)ctx;

  /* operation table */
  svd->ops->view           = SVDView_TRLANCZOS;
  svd->ops->setfromoptions = SVDSetFromOptions_TRLANCZOS;
  svd->ops->solve          = SVDSolve_TRLANCZOS;
  svd->ops->setup          = SVDSetUp_TRLANCZOS;

  /* make the type-specific setter reachable through SVDTRLanczosSetOneSide() */
  ierr = PetscObjectComposeFunctionDynamic((PetscObject)svd,"SVDTRLanczosSetOneSide_C","SVDTRLanczosSetOneSide_TRLANCZOS",SVDTRLanczosSetOneSide_TRLANCZOS);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
340
EXTERN_C_END