230 SUBROUTINE chetrd_hb2st( STAGE1, VECT, UPLO, N, KD, AB, LDAB,
231 $ D, E, HOUS, LHOUS, WORK, LWORK, INFO )
246 CHARACTER STAGE1, UPLO, VECT
247 INTEGER N, KD, LDAB, LHOUS, LWORK, INFO
251 COMPLEX AB( LDAB, * ), HOUS( * ), WORK( * )
259 parameter( rzero = 0.0e+0,
260 $ zero = ( 0.0e+0, 0.0e+0 ),
261 $ one = ( 1.0e+0, 0.0e+0 ) )
264 LOGICAL LQUERY, WANTQ, UPPER, AFTERS1
265 INTEGER I, M, K, IB, SWEEPID, MYID, SHIFT, STT, ST,
266 $ ed, stind, edind, blklastind, colpt, thed,
267 $ stepercol, grsiz, thgrsiz, thgrnb, thgrid,
268 $ nbtiles, ttype, tid, nthreads, debug,
269 $ abdpos, abofdpos, dpos, ofdpos, awpos,
270 $ inda, indw, apos, sizea, lda, indv, indtau,
271 $ sicev, sizetau, ldv, lhmin, lwmin
279 INTRINSIC min, max, ceiling, real
284 EXTERNAL lsame, ilaenv2stage
293 afters1 = lsame( stage1,
'Y' )
294 wantq = lsame( vect,
'V' )
295 upper = lsame( uplo,
'U' )
296 lquery = ( lwork.EQ.-1 ) .OR. ( lhous.EQ.-1 )
300 ib = ilaenv2stage( 2,
'CHETRD_HB2ST', vect, n, kd, -1, -1 )
301 lhmin = ilaenv2stage( 3,
'CHETRD_HB2ST', vect, n, kd, ib, -1 )
302 lwmin = ilaenv2stage( 4,
'CHETRD_HB2ST', vect, n, kd, ib, -1 )
304 IF( .NOT.afters1 .AND. .NOT.lsame( stage1,
'N' ) )
THEN
306 ELSE IF( .NOT.lsame( vect,
'N' ) )
THEN
308 ELSE IF( .NOT.upper .AND. .NOT.lsame( uplo,
'L' ) )
THEN
310 ELSE IF( n.LT.0 )
THEN
312 ELSE IF( kd.LT.0 )
THEN
314 ELSE IF( ldab.LT.(kd+1) )
THEN
316 ELSE IF( lhous.LT.lhmin .AND. .NOT.lquery )
THEN
318 ELSE IF( lwork.LT.lwmin .AND. .NOT.lquery )
THEN
328 CALL xerbla(
'CHETRD_HB2ST', -info )
330 ELSE IF( lquery )
THEN
348 indv = indtau + sizetau
365 awpos = inda + kd + 1
381 d( i ) = real( ab( abdpos, i ) )
404 d( i ) = real( ab( abdpos, i ) )
411 tmp = ab( abofdpos, i+1 )
413 ab( abofdpos, i+1 ) = abstmp
415 IF( abstmp.NE.rzero )
THEN
421 $ ab( abofdpos, i+2 ) = ab( abofdpos, i+2 )*tmp
428 tmp = ab( abofdpos, i )
430 ab( abofdpos, i ) = abstmp
432 IF( abstmp.NE.rzero )
THEN
438 $ ab( abofdpos, i+1 ) = ab( abofdpos, i+1 )*tmp
456 nbtiles = ceiling( real(n)/real(kd) )
457 stepercol = ceiling( real(shift)/real(grsiz) )
458 thgrnb = ceiling( real(n-1)/real(thgrsiz) )
460 CALL clacpy(
"A", kd+1, n, ab, ldab, work( apos ), lda )
461 CALL claset(
"A", kd, n, zero, zero, work( awpos ), lda )
478 DO 100 thgrid = 1, thgrnb
479 stt = (thgrid-1)*thgrsiz+1
480 thed = min( (stt + thgrsiz -1), (n-1))
484 DO 120 m = 1, stepercol
486 DO 130 sweepid = st, ed
488 myid = (i-sweepid)*(stepercol*grsiz)
490 IF ( myid.EQ.1 )
THEN
493 ttype = mod( myid, 2 ) + 2
496 IF( ttype.EQ.2 )
THEN
497 colpt = (myid/2)*kd + sweepid
502 colpt = ((myid+1)/2)*kd + sweepid
505 IF( ( stind.GE.edind-1 ).AND.
506 $ ( edind.EQ.n ) )
THEN
516 IF( ttype.NE.1 )
THEN
520 tid = omp_get_thread_num()
522 $ stind, edind, sweepid, n, kd, ib,
524 $ hous( indv ), hous( indtau ), ldv,
525 $ work( indw + tid*kd ) )
530 tid = omp_get_thread_num()
532 $ stind, edind, sweepid, n, kd, ib,
534 $ hous( indv ), hous( indtau ), ldv,
535 $ work( indw + tid*kd ) )
540 $ stind, edind, sweepid, n, kd, ib,
542 $ hous( indv ), hous( indtau ), ldv,
543 $ work( indw + tid*kd ) )
545 IF ( blklastind.GE.(n-1) )
THEN
564 d( i ) = real( work( dpos+(i-1)*lda ) )
572 e( i ) = real( work( ofdpos+i*lda ) )
576 e( i ) = real( work( ofdpos+(i-1)*lda ) )