Add Dsytrd and tests

2025-10-20 21:59:25 +08:00 · 2016-02-09 21:39:50 -07:00
parent 29eff129d1
commit fe0ba91d41
3 changed files with 234 additions and 0 deletions
--- a/native/dsytrd.go
+++ b/native/dsytrd.go
@@ -0,0 +1,150 @@
 // Copyright ©2016 The gonum Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 package native
 import (
 	"github.com/gonum/blas"
 	"github.com/gonum/blas/blas64"
 )
 // Dsytrd reduces a symmetric n×n matrix A to symmetric tridiagonal form by an
 // orthogonal similarity transformation
 //  Q^T * A * Q = T
 // where Q is an orthonormal matrix and T is symmetric and tridiagonal.
 //
 // On entry, a contains the elements of the input matrix in the triangle specified
 // by uplo. On exit, the diagonal and sub/super-diagonal are overwritten by the
 // corresponding elements of the tridiagonal matrix T. The remaining elements in
 // the triangle, along with the array tau, contain the data to construct Q as
 // the product of elementary reflectors.
 //
 // If uplo == blas.Upper, Q is constructed with
 //  Q = H[n-2] * ... * H[1] * H[0]
 // where
 //  H[i] = I - tau * v * v^T
 // v is constructed as v[i+1:n] = 0, v[i] = 1, v[0:i-1] is stored in A[0:i-1, i+1],
 // and tau is in tau[i]. The elements of A are
 //  [ d  e  v2 v3 v4]
 //  [    d  e  v3 v4]
 //  [       d   e v4]
 //  [           d  e]
 //  [              e]
 //
 // If uplo == blas.Lower, Q is constructed with
 //  Q = H[0] * H[1] * ... * H[n-2]
 // where
 //  H[i] = I - tau * v * v^T
 // v is constructed as v[0:i+1] = 0, v[i+1] = 1, v[i+2:n] is stored in A[i+2:n, i],
 // and tau is in tau[i]. The elements of A are
 //  [ d            ]
 //  [ e  d         ]
 //  [v1  e  d      ]
 //  [v1 v2  e  d   ]
 //  [v1 v2  v3 e  d]
 //
 // d must have length n, and e and tau must have length n-1. Dsytrd will panic if
 // these conditions are not met.
 //
 // work is temporary storage, and lwork specifies the usable memory length. At minimum,
 // lwork >= 1, and Dsytrd will panic otherwise. The amount of blocking is
 // limited by the usable length.
 // If lwork == -1, instead of computing Dsytrd the optimal work length is stored
 // into work[0].
 func (impl Implementation) Dsytrd(uplo blas.Uplo, n int, a []float64, lda int, d, e, tau, work []float64, lwork int) {
 	upper := uplo == blas.Upper
 	opts := "U"
 	if !upper {
 		opts = "L"
 	}
 	nb := impl.Ilaenv(1, "DSYTRD", opts, n, -1, -1, -1)
 	lworkopt := n * nb
 	work[0] = float64(lworkopt)
 	if lwork == -1 {
 		return
 	}
 	if n == 0 {
 		work[0] = 1
 	}
 	nx := n
 	bi := blas64.Implementation()
 	var ldwork int
 	if nb > 1 && nb < n {
 		// Determine when to cross over from blocked to unblocked code. The last
 		// block is always handled by unblocked code.
 		opts := "L"
 		if upper {
 			opts = "U"
 		}
 		nx = max(nb, impl.Ilaenv(3, "DSYTRD", opts, n, -1, -1, -1))
 		if nx < n {
 			// Determine if workspace is large enough for blocked code.
 			ldwork = nb
 			iws := n * ldwork
 			if lwork < iws {
 				// Not enough workspace to use optimal nb: determine the minimum
 				// value of nb and reduce nb or force use of unblocked code by
 				// setting nx = n.
 				nb = max(lwork/n, 1)
 				nbmin := impl.Ilaenv(2, "DSYTRD", opts, n, -1, -1, -1)
 				if nb < nbmin {
 					nx = n
 				}
 			}
 		} else {
 			nx = n
 		}
 	} else {
 		nb = 1
 	}
 	ldwork = nb
 	if upper {
 		// Reduce the upper triangle of A. Columns 0:kk are handled by the
 		// unblocked method.
 		var i int
 		kk := n - ((n-nx+nb-1)/nb)*nb
 		for i = n - nb; i >= kk; i -= nb {
 			// Reduce columns i:i+nb to tridiagonal form and form the matrix W
 			// which is needed to update the unreduced part of the matrix.
 			impl.Dlatrd(uplo, i+nb, nb, a, lda, e, tau, work, ldwork)
 			// Update the unreduced submatrix A[0:i-1,0:i-1], using an update
 			// of the form A = A - V*W^T - W*V^T.
 			bi.Dsyr2k(uplo, blas.NoTrans, i, nb, -1, a[i:], lda, work, ldwork, 1, a, lda)
 			// Copy superdiagonal elements back into A, and diagonal elements into D.
 			for j := i; j < i+nb; j++ {
 				a[(j-1)*lda+j] = e[j-1]
 				d[j] = a[j*lda+j]
 			}
 		}
 		// Use unblocked code to reduce the last or only block
 		// check that i == kk.
 		impl.Dsytd2(uplo, kk, a, lda, d, e, tau)
 	} else {
 		var i int
 		// Reduce the lower triangle of A.
 		for i = 0; i < n-nx; i += nb {
 			// Reduce columns 0:i+nb to tridiagonal form and form the matrix W
 			// which is needed to update the unreduced part of the matrix.
 			impl.Dlatrd(uplo, n-i, nb, a[i*lda+i:], lda, e[i:], tau[i:], work, ldwork)
 			// Update the unreduced submatrix A[i+ib:n, i+ib:n], using an update
 			// of the form A = A + V*W^T - W*V^T.
 			bi.Dsyr2k(uplo, blas.NoTrans, n-i-nb, nb, -1, a[(i+nb)*lda+i:], lda,
 				work[nb+i:], ldwork, 1, a[(i+nb)*lda+i+nb:], lda)
 			// Copy subdiagonal elements back into A, and diagonal elements into D.
 			for j := i; j < i+nb; j++ {
 				a[(j+1)*lda+j] = e[j]
 				d[j] = a[j*lda+j]
 			}
 		}
 		// Use unblocked code to reduce the last or only block.
 		impl.Dsytd2(uplo, n-i, a[i*lda+i:], lda, d[i:], e[i:], tau[i:])
 	}
 	work[0] = float64(lworkopt)
 }
--- a/native/lapack_test.go
+++ b/native/lapack_test.go
@@ -220,6 +220,10 @@ func TestDsytd2(t *testing.T) {
 	testlapack.Dsytd2Test(t, impl)
 }
 func TestDsytrd(t *testing.T) {
 	testlapack.DsytrdTest(t, impl)
 }
 func TestDtrcon(t *testing.T) {
 	testlapack.DtrconTest(t, impl)
 }
--- a/testlapack/dsytrd.go
+++ b/testlapack/dsytrd.go
@@ -0,0 +1,80 @@
 // Copyright ©2016 The gonum Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 package testlapack
 import (
 	"fmt"
 	"math/rand"
 	"testing"
 	"github.com/gonum/blas"
 	"github.com/gonum/floats"
 )
 type Dsytrder interface {
 	Dsytrd(uplo blas.Uplo, n int, a []float64, lda int, d, e, tau, work []float64, lwork int)
 	Dsytd2er
 }
 func DsytrdTest(t *testing.T, impl Dsytrder) {
 	for _, uplo := range []blas.Uplo{blas.Upper} {
 		for _, test := range []struct {
 			n, lda int
 		}{
 			{10, 0},
 			{50, 0},
 			{100, 0},
 			{150, 0},
 			{300, 0},
 			{10, 20},
 			{50, 70},
 			{100, 120},
 			{150, 170},
 			{300, 320},
 		} {
 			n := test.n
 			lda := test.lda
 			if lda == 0 {
 				lda = n
 			}
 			a := make([]float64, n*lda)
 			for i := range a {
 				a[i] = rand.NormFloat64()
 			}
 			d2 := make([]float64, n)
 			e2 := make([]float64, n)
 			tau2 := make([]float64, n)
 			aCopy := make([]float64, len(a))
 			copy(aCopy, a)
 			impl.Dsytd2(uplo, n, a, lda, d2, e2, tau2)
 			aAns := make([]float64, len(a))
 			copy(aAns, a)
 			copy(a, aCopy)
 			d := make([]float64, n)
 			e := make([]float64, n)
 			tau := make([]float64, n)
 			work := make([]float64, 1)
 			impl.Dsytrd(uplo, n, a, lda, d, e, tau, work, -1)
 			work = make([]float64, int(work[0]))
 			impl.Dsytrd(uplo, n, a, lda, d, e, tau, work, len(work))
 			errStr := fmt.Sprintf("upper = %v, n = %v", uplo == blas.Upper, n)
 			if !floats.EqualApprox(a, aAns, 1e-8) {
 				t.Errorf("A mismatch: %s", errStr)
 			}
 			if !floats.EqualApprox(d, d2, 1e-8) {
 				t.Errorf("D mismatch: %s", errStr)
 			}
 			if !floats.EqualApprox(e, e2, 1e-8) {
 				t.Errorf("E mismatch: %s", errStr)
 			}
 			if !floats.EqualApprox(tau, tau2, 1e-8) {
 				t.Errorf("Tau mismatch: %s", errStr)
 			}
 		}
 	}
 }