From 296a71be684afc7e67963aae46b2dfa420397417 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Tue, 11 Oct 2022 18:20:09 +0200
Subject: [PATCH 01/14] rebase

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 230 ++++++++++++
 tests/smoke/CMakeLists.txt                    |   4 +
 tests/smoke/alp_stedc.cpp                     | 344 ++++++++++++++++++
 3 files changed, 578 insertions(+)
 create mode 100644 include/alp/algorithms/symm_tridiag_eigensolver.hpp
 create mode 100644 tests/smoke/alp_stedc.cpp
diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
new file mode 100644
index 000000000..61c4c2af2
--- /dev/null
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -0,0 +1,230 @@
+/*
+ *   Copyright 2021 Huawei Technologies Co., Ltd.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include <iostream>
+#include <sstream>
+
+#include <alp.hpp>
+#include <graphblas/utils/iscomplex.hpp> // use from grb
+#include "../tests/utils/print_alp_containers.hpp"
+
+namespace alp {
+
+	namespace algorithms {
+
+		/**
+		 * Calcualte eigendecomposition of symmetric tridiagonal matrix T
+		 *        \f$T = Qdiag(d)Q^T\f$ where
+		 *        \a T is real symmetric tridiagonal
+		 *        \a Q is orthogonal (columns are eigenvectors).
+		 *        \a d is vector containing eigenvalues.
+		 *
+		 * @tparam D        Data element type
+		 * @tparam Ring     Type of the semiring used in the computation
+		 * @tparam Minus    Type minus operator used in the computation
+		 * @tparam Divide   Type of divide operator used in the computation
+		 * @param[out] Q    output orthogonal matrix contaning eigenvectors
+		 * @param[out] d    output vector containg eigenvalues
+		 * @param[in]  T    input symmetric tridiagonal matrix
+		 * @param[in]  ring A semiring for operations
+		 * @return RC       SUCCESS if the execution was correct
+		 *
+		 */
+		template<
+			typename D,
+			typename SymmOrHermTridiagonalType,
+			typename OrthogonalType,
+			class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >,
+			class Minus = operators::subtract< D >,
+			class Divide = operators::divide< D >
+		>
+		RC symm_tridiag_eigensolver(
+			Matrix< D, SymmOrHermTridiagonalType, Dense > T,
+			Matrix< D, OrthogonalType, Dense > &Q,
+			Vector< D, structures::General, Dense > &d,
+			const Ring & ring = Ring(),
+			const Minus & minus = Minus(),
+			const Divide & divide = Divide() ) {
+
+			RC rc = SUCCESS;
+
+// 			const Scalar< D > zero( ring.template getZero< D >() );
+// 			const Scalar< D > one( ring.template getOne< D >() );
+// 			const size_t n = nrows( H );
+
+// 			// Q = identity( n )
+// 			rc = alp::set( Q, zero );
+// 			auto Qdiag = alp::get_view< alp::view::diagonal >( Q );
+// 			rc = rc ? rc : alp::set( Qdiag, one );
+// 			if( rc != SUCCESS ) {
+// 				std::cerr << " set( Q, I ) failed\n";
+// 				return rc;
+// 			}
+
+// 			// Out of place specification of the computation
+// 			Matrix< D, SymmOrHermType, Dense > RR( n );
+
+// 			rc = set( RR, H );
+// 			if( rc != SUCCESS ) {
+// 				std::cerr << " set( RR, H ) failed\n";
+// 				return rc;
+// 			}
+// #ifdef DEBUG
+// 			print_matrix( " << RR >> ", RR );
+// #endif
+
+// 			// a temporary for storing the mxm result
+// 			Matrix< D, OrthogonalType, Dense > Qtmp( n, n );
+
+// 			for( size_t k = 0; k < n - 2; ++k ) {
+// #ifdef DEBUG
+// 				std::string matname(" << RR(");
+// 				matname = matname + std::to_string(k);
+// 				matname = matname + std::string( ") >> ");
+// 				print_matrix( matname , RR );
+// #endif
+
+// 				const size_t m = n - k - 1;
+
+// 				// ===== Begin Computing v =====
+// 				// v = H[ k + 1 : , k ]
+// 				// alpha = norm( v ) * v[ 0 ] / norm( v[ 0 ] )
+// 				// v = v - alpha * e1
+// 				// v = v / norm ( v )
+
+// 				auto v_view = get_view( RR, k, utils::range( k + 1, n ) );
+// 				Vector< D, structures::General, Dense > v( n - ( k + 1 ) );
+// 				rc = set( v, v_view );
+// 				if( rc != SUCCESS ) {
+// 					std::cerr << " set( v, view ) failed\n";
+// 					return rc;
+// 				}
+
+// 				Scalar< D > alpha( zero );
+// 				rc = norm2( alpha, v, ring );
+// 				if( rc != SUCCESS ) {
+// 					std::cerr << " norm2( alpha, v, ring ) failed\n";
+// 					return rc;
+// 				}
+
+// 				rc = eWiseLambda(
+// 					[ &alpha, &ring, &divide, &minus ]( const size_t i, D &val ) {
+// 						if ( i == 0 ) {
+// 							Scalar< D > norm_v0( std::abs( val ) );
+// 							Scalar< D > val_scalar( val );
+// 							foldl( alpha, val_scalar, ring.getMultiplicativeOperator() );
+// 							foldl( alpha, norm_v0, divide );
+// 							foldl( val_scalar, alpha, minus );
+// 							val = *val_scalar;
+// 						}
+// 					},
+// 					v
+// 				);
+// 				if( rc != SUCCESS ) {
+// 					std::cerr << " eWiseLambda( lambda, v ) failed\n";
+// 					return rc;
+// 				}
+
+// 				Scalar< D > norm_v( zero );
+// 				rc = norm2( norm_v, v, ring );
+// 				if( rc != SUCCESS ) {
+// 					std::cerr << " norm2( norm_v, v, ring ) failed\n";
+// 					return rc;
+// 				}
+
+// 				rc = foldl(v, norm_v, divide );
+// #ifdef DEBUG
+// 				print_vector( " v = ", v );
+// #endif
+// 				// ===== End Computing v =====
+
+// 				// ===== Calculate reflector Qk =====
+// 				// Q_k = identity( n )
+// 				Matrix< D, SymmOrHermType, Dense > Qk( n );
+// 				rc = alp::set( Qk, zero );
+// 				auto Qk_diag = alp::get_view< alp::view::diagonal >( Qk );
+// 				rc = rc ? rc : alp::set( Qk_diag, one );
+
+// 				// this part can be rewriten without temp matrix using functors
+// 				Matrix< D, SymmOrHermType, Dense > vvt( m );
+
+// 				rc = rc ? rc : set( vvt, outer( v, ring.getMultiplicativeOperator() ) );
+// 				// vvt = 2 * vvt
+// 				rc = rc ? rc : foldr( Scalar< D >( 2 ), vvt, ring.getMultiplicativeOperator() );
+
+
+// #ifdef DEBUG
+// 				print_matrix( " vvt ", vvt );
+// #endif
+
+// 				// Qk = Qk - vvt ( expanded: I - 2 * vvt )
+// 				auto Qk_view = get_view< SymmOrHermType >( Qk, utils::range( k + 1, n ), utils::range( k + 1, n ) );
+// 				if ( grb::utils::is_complex< D >::value ) {
+// 					rc = rc ? rc : foldl( Qk_view, alp::get_view< alp::view::transpose >( vvt ), minus );
+// 				} else {
+// 					rc = rc ? rc : foldl( Qk_view, vvt, minus );
+// 				}
+
+// #ifdef DEBUG
+// 				print_matrix( " << Qk >> ", Qk );
+// #endif
+// 				// ===== End of Calculate reflector Qk ====
+
+// 				// ===== Update R =====
+// 				// Rk = Qk * Rk * Qk
+
+// 				// RRQk = RR * Qk
+// 				Matrix< D, structures::Square, Dense > RRQk( n );
+// 				rc = rc ? rc : set( RRQk, zero );
+// 				rc = rc ? rc : mxm( RRQk, RR, Qk, ring );
+// 				if( rc != SUCCESS ) {
+// 					std::cerr << " mxm( RRQk, RR, Qk, ring ); failed\n";
+// 					return rc;
+// 				}
+// #ifdef DEBUG
+// 				print_matrix( " << RR x Qk = >> ", RRQk );
+// #endif
+// 				// RR = Qk * RRQk
+// 				rc = rc ? rc : set( RR, zero );
+// 				rc = rc ? rc : mxm( RR, Qk, RRQk, ring );
+
+// #ifdef DEBUG
+// 				print_matrix( " << RR( updated ) >> ", RR );
+// #endif
+// 				// ===== End of Update R =====
+
+// 				// ===== Update Q =====
+// 				// Q = Q * Qk
+
+// 				// Qtmp = Q * Qk
+// 				rc = rc ? rc : set( Qtmp, zero );
+// 				rc = rc ? rc : mxm( Qtmp, Q, Qk, ring );
+
+// 				// Q = Qtmp
+// 				rc = rc ? rc : set( Q, Qtmp );
+// #ifdef DEBUG
+// 				print_matrix( " << Q updated >> ", Q );
+// #endif
+// 				// ===== End of Update Q =====
+// 			}
+
+// 			// T = RR
+
+// 			rc = rc ? rc : set( T, get_view< SymmOrHermTridiagonalType > ( RR ) );
+			return rc;
+		}
+	} // namespace algorithms
+} // namespace alp
diff --git a/tests/smoke/CMakeLists.txt b/tests/smoke/CMakeLists.txt
index 7dd766712..16200d0fc 100644
--- a/tests/smoke/CMakeLists.txt
+++ b/tests/smoke/CMakeLists.txt
@@ -185,6 +185,10 @@ add_grb_executables( alp_zgeqrf_complex alp_zgeqrf.cpp
 	COMPILE_DEFINITIONS _COMPLEX
 )
 
+add_grb_executables( alp_stedc alp_stedc.cpp
+        BACKENDS alp_reference
+)
+
 # targets to list and build the test for this category
 get_property( smoke_tests_list GLOBAL PROPERTY tests_category_smoke )
 add_custom_target( "list_tests_category_smoke"
diff --git a/tests/smoke/alp_stedc.cpp b/tests/smoke/alp_stedc.cpp
new file mode 100644
index 000000000..742893d76
--- /dev/null
+++ b/tests/smoke/alp_stedc.cpp
@@ -0,0 +1,344 @@
+/*
+ *   Copyright 2021 Huawei Technologies Co., Ltd.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include <iostream>
+#include <sstream>
+#include <vector>
+
+// currently only real version
+// #ifdef _COMPLEX
+// #include <complex>
+// #include <cmath>
+// #include <iomanip>
+// #endif
+
+#define DEBUG
+
+#include <alp.hpp>
+#include <alp/algorithms/symm_tridiag_eigensolver.hpp>
+#include <graphblas/utils/iscomplex.hpp> // use from grb
+#include "../utils/print_alp_containers.hpp"
+
+//once TEMPDISABLE is removed the code should be in the final version
+#define TEMPDISABLE
+
+using namespace alp;
+
+using BaseScalarType = double;
+using Orthogonal = structures::Orthogonal;
+
+// #ifdef _COMPLEX
+// using ScalarType = std::complex< BaseScalarType >;
+// //not fully implemented structures
+// using HermitianOrSymmetricTridiagonal = structures::HermitianTridiagonal;
+// using HermitianOrSymmetric = structures::Hermitian;
+// #else
+using ScalarType = BaseScalarType;
+using HermitianOrSymmetricTridiagonal = structures::SymmetricTridiagonal;
+//fully implemented structures
+using HermitianOrSymmetric = structures::Symmetric;
+// #endif
+
+constexpr BaseScalarType tol = 1.e-10;
+constexpr size_t RNDSEED = 1;
+
+//temp function untill Hermitian containter is implemented
+//** gnerate symmetric-hermitian matrix in a square container */
+template<
+	typename T
+>
+std::vector< T > generate_symmherm_tridiag_matrix_data(
+	size_t N,
+	const typename std::enable_if<
+		grb::utils::is_complex< T >::value,
+		void
+	>::type * const = nullptr
+) {
+	std::vector< T > data( N * N );
+	std::fill(data.begin(), data.end(), static_cast< T >( 0 ) );
+	std::srand( RNDSEED );
+	for( size_t i = 0; i < N; ++i ) {
+		for( size_t j = i; ( j < N ) && ( j <= i + 1 ); ++j ) {
+			T val( std::rand(), std::rand() );
+			data[ i * N + j ] = val / std::abs( val );
+			data[ j * N + i ] += grb::utils::is_complex< T >::conjugate( data[ i * N + j ] );
+		}
+	}
+	return data;
+}
+
+//** generate upper/lower triangular part of a Symmetric matrix */
+template<
+	typename T
+>
+std::vector< T >  generate_symmherm_tridiag_matrix_data(
+	size_t N,
+	const typename std::enable_if<
+		!grb::utils::is_complex< T >::value,
+		void
+	>::type * const = nullptr
+) {
+	std::vector< T > data( N * N );
+	std::srand( RNDSEED );
+	for( size_t i = 0; i < N; ++i ) {
+		for( size_t j = i; ( j < N ) && ( j <= i + 1 ); ++j ) {
+			T val = static_cast< T >( std::rand() )  / RAND_MAX;
+			data[ i * N + j ] = val;
+			data[ j * N + i ] += grb::utils::is_complex< T >::conjugate( data[ i * N + j ] );
+		}
+	}
+	return data;
+}
+
+// //** check if rows/columns or matrix Q are orthogonal */
+// template<
+// 	typename T,
+// 	typename Structure,
+// 	typename ViewType,
+// 	class Ring = Semiring< operators::add< T >, operators::mul< T >, identities::zero, identities::one >
+// >
+// RC check_overlap( alp::Matrix< T, Structure, alp::Density::Dense, ViewType > &Q, const Ring & ring = Ring() ) {
+// 	RC rc = SUCCESS;
+// 	const size_t n = nrows( Q );
+// #ifdef DEBUG
+// 	std::cout << "Overlap matrix for Q:\n";
+// #endif
+// 	for ( size_t i = 0; i < n; ++i ) {
+// 		auto vi = get_view( Q, i, utils::range( 0, n ) );
+// 		for ( size_t j = 0; j < n; ++j ) {
+// 			auto vj = get_view( Q, j, utils::range( 0, n ) );
+// 			Scalar< T > alpha( ring.template getZero< T >() );
+// 			rc = dot( alpha, vi, vj, ring );
+// 			if( rc != SUCCESS ) {
+// 				std::cerr << " dot( alpha, vi, vj, ring ) failed\n";
+// 				return PANIC;
+// 			}
+// 			if( i == j ) {
+// 				if( std::abs( *alpha - ring.template getOne< T >() ) > tol ) {
+// 					std::cerr << " vector " << i << " not normalized\n";
+// 					return PANIC;
+// 				}
+// 			} else {
+// 				if( std::abs( *alpha ) > tol ) {
+// 					std::cerr << " vector " << i << " and vctor " << j << " are note orthogonal\n";
+// 					return PANIC;
+// 				}
+// 			}
+// #ifdef DEBUG
+// 			std::cout << "\t" << std::abs( *alpha );
+// #endif
+// 		}
+// #ifdef DEBUG
+// 		std::cout << "\n";
+// #endif
+// 	}
+// #ifdef DEBUG
+// 	std::cout << "\n";
+// #endif
+// 	return rc;
+// }
+
+
+// //** check solution by calculating H-QTQh */
+// template<
+// 	typename D,
+// 	typename StructureSymm,
+// 	typename StructureOrth,
+// 	typename StructureTrDg,
+// 	class Minus = operators::subtract< D >,
+// 	class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >
+// >
+// RC check_solution(
+// 	alp::Matrix< D, StructureSymm, alp::Density::Dense > &H,
+// 	alp::Matrix< D, StructureOrth, alp::Density::Dense > &Q,
+// 	alp::Matrix< D, StructureTrDg, alp::Density::Dense > &T,
+// 	const Ring &ring = Ring(),
+// 	const Minus &minus = Minus()
+// ) {
+// 	RC rc = SUCCESS;
+// 	const size_t n = nrows( Q );
+
+// #ifdef DEBUG
+// 	std::cout << " ** check_solution **\n";
+// 	std::cout << " input matrices:\n";
+// 	print_matrix( " << H >> ", H );
+// 	print_matrix( " << Q >> ", Q );
+// 	print_matrix( " << T >> ", T );
+// 	std::cout << " ********************\n";
+// #endif
+
+// 	alp::Matrix< D, alp::structures::Square, alp::Density::Dense > QTQh( n );
+// 	alp::Matrix< D, alp::structures::Square, alp::Density::Dense > QTQhmH( n );
+// 	const Scalar< D > zero( ring.template getZero< D >() );
+
+// 	rc = rc ? rc : set( QTQh, zero );
+// 	rc = rc ? rc : mxm( QTQh, T, conjugate( alp::get_view< alp::view::transpose >( Q ) ), ring );
+// 	rc = rc ? rc : set( QTQhmH, zero );
+// 	rc = rc ? rc : mxm( QTQhmH, Q, QTQh, ring );
+// 	rc = rc ? rc : set( QTQh, QTQhmH );
+// #ifdef DEBUG
+// 	print_matrix( " << QTQhmH >> ", QTQhmH );
+// 	print_matrix( " << H >> ", H );
+// 	std::cout << "call foldl( mat, mat, minus )\n";
+// #endif
+
+// #ifndef TEMPDISABLE
+// 	rc = foldl( QTQhmH, H, minus );
+// #else
+// 	rc = rc ? rc : alp::eWiseLambda(
+// 		[ &H, &minus, &zero ]( const size_t i, const size_t j, D &val ) {
+// 			if ( j >= i ) {
+// 				internal::foldl(
+// 					val,
+// 					internal::access( H, internal::getStorageIndex( H, i, j ) ),
+// 					minus
+// 				);
+// 			} else {
+// 				val = *zero;
+// 			}
+// 		},
+// 		QTQhmH
+// 	);
+// #endif
+
+// #ifdef DEBUG
+// 	print_matrix( " << QTQhmH >> ", QTQhmH );
+// 	print_matrix( " << H >> ", H );
+// #endif
+
+// 	//Frobenius norm
+// 	D fnorm = ring.template getZero< D >();
+// 	rc = rc ? rc : alp::eWiseLambda(
+// 		[ &fnorm, &ring ]( const size_t i, const size_t j, D &val ) {
+// 			(void) i;
+// 			(void) j;
+// 			internal::foldl( fnorm, val * val, ring.getAdditiveOperator() );
+// 		},
+// 		QTQhmH
+// 	);
+// 	fnorm = std::sqrt( fnorm );
+
+// #ifdef DEBUG
+// 	std::cout << " FrobeniusNorm(H-QTQh) = " << std::abs( fnorm ) << "\n";
+// #endif
+// 	if( tol < std::abs( fnorm ) ) {
+// #ifdef DEBUG
+// 		std::cout << " ----------------------\n";
+// 		std::cout << " compare matrices\n";
+// 		print_matrix( " << H >> ", H );
+// 		print_matrix( " << QTQh >> ", QTQh );
+// 		std::cout << " ----------------------\n";
+// #endif
+// 		std::cout << "The Frobenius norm is too large.\n";
+// 		return FAILED;
+// 	}
+
+// 	return rc;
+// }
+
+
+
+void alp_program( const size_t & unit, alp::RC & rc ) {
+	rc = SUCCESS;
+
+	alp::Semiring<
+		alp::operators::add< ScalarType >,
+		alp::operators::mul< ScalarType >,
+		alp::identities::zero,
+		alp::identities::one
+	> ring;
+
+	// dimensions of sqare matrices H, Q and R
+	size_t N = unit;
+
+	alp::Matrix< ScalarType, Orthogonal > Q( N );
+	alp::Matrix< ScalarType, HermitianOrSymmetricTridiagonal > T( N );
+	// Vector< ScalarType, structures::General, Dense > d( N );
+	Vector< ScalarType, structures::General, Dense > d( N );
+	{
+		auto matrix_data = generate_symmherm_tridiag_matrix_data< ScalarType >( N );
+		rc = rc ? rc : alp::buildMatrix( T, matrix_data.begin(), matrix_data.end() );
+	}
+#ifdef DEBUG
+	print_matrix( " input matrix T ", T );
+#endif
+
+  	rc = rc ? rc : algorithms::symm_tridiag_eigensolver( T, Q, d );
+
+
+// #ifdef DEBUG
+// 	print_matrix( " << Q >> ", Q );
+// 	print_matrix( " << T >> ", T );
+// #endif
+
+// 	rc = check_overlap( Q );
+// 	if( rc != SUCCESS ) {
+// 		std::cout << "Error: mratrix Q is not orthogonal\n";
+// 	}
+
+// 	rc = check_solution( H, Q, T );
+// 	if( rc != SUCCESS ) {
+// 		std::cout << "Error: solution numerically wrong\n";
+// 	}
+}
+
+int main( int argc, char ** argv ) {
+	// defaults
+	bool printUsage = false;
+	size_t in = 5;
+
+	// error checking
+	if( argc > 2 ) {
+		printUsage = true;
+	}
+	if( argc == 2 ) {
+		size_t read;
+		std::istringstream ss( argv[ 1 ] );
+		if( ! ( ss >> read ) ) {
+			std::cerr << "Error parsing first argument\n";
+			printUsage = true;
+		} else if( ! ss.eof() ) {
+			std::cerr << "Error parsing first argument\n";
+			printUsage = true;
+		} else if( read % 2 != 0 ) {
+			std::cerr << "Given value for n is odd\n";
+			printUsage = true;
+		} else {
+			// all OK
+			in = read;
+		}
+	}
+	if( printUsage ) {
+		std::cerr << "Usage: " << argv[ 0 ] << " [n]\n";
+		std::cerr << "  -n (optional, default is 100): an even integer, the "
+					 "test size.\n";
+		return 1;
+	}
+
+	std::cout << "This is functional test " << argv[ 0 ] << "\n";
+	alp::Launcher< AUTOMATIC > launcher;
+	alp::RC out;
+	if( launcher.exec( &alp_program, in, out, true ) != SUCCESS ) {
+		std::cerr << "Launching test FAILED\n";
+		return 255;
+	}
+	if( out != SUCCESS ) {
+		std::cerr << "Test FAILED (" << alp::toString( out ) << ")" << std::endl;
+	} else {
+		std::cout << "Test OK" << std::endl;
+	}
+	return 0;
+}

From 9da194b8c88108a2df1632c071351852926965c0 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Thu, 13 Oct 2022 16:49:22 +0200
Subject: [PATCH 02/14] main part of the algorithm works

-added det_view for orthogonal and symmetrictridiagonal matrices

missing
- mxv
- divide and conquer (diag-outer) solver
- permute view
- sort
- ?
---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 421 +++++++++++-------
 include/alp/storage.hpp                       |  16 +-
 include/alp/structures.hpp                    |  16 +
 tests/smoke/alp_stedc.cpp                     |  24 +-
 4 files changed, 294 insertions(+), 183 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index 61c4c2af2..1a341d869 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -21,6 +21,9 @@
 #include <graphblas/utils/iscomplex.hpp> // use from grb
 #include "../tests/utils/print_alp_containers.hpp"
 
+// TEMPDISABLE should be removed in the final version
+#define TEMPDISABLE
+
 namespace alp {
 
 	namespace algorithms {
@@ -47,183 +50,265 @@ namespace alp {
 			typename D,
 			typename SymmOrHermTridiagonalType,
 			typename OrthogonalType,
+			typename SymmHermTrdiViewType,
+			typename OrthViewType,
+			typename SymmHermTrdiImfR,
+			typename SymmHermTrdiImfC,
+			typename OrthViewImfR,
+			typename OrthViewImfC,
+			typename VecViewType,
+			typename VecImfR,
+			typename VecImfC,
 			class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >,
 			class Minus = operators::subtract< D >,
 			class Divide = operators::divide< D >
 		>
-		RC symm_tridiag_eigensolver(
-			Matrix< D, SymmOrHermTridiagonalType, Dense > T,
-			Matrix< D, OrthogonalType, Dense > &Q,
-			Vector< D, structures::General, Dense > &d,
+		RC symm_tridiag_dac_eigensolver(
+			Matrix<
+				D,
+				SymmOrHermTridiagonalType,
+				Dense,
+				SymmHermTrdiViewType,
+				SymmHermTrdiImfR,
+				SymmHermTrdiImfC
+			> &T,
+			Matrix<
+				D,
+				OrthogonalType,
+				Dense,
+				OrthViewType,
+				OrthViewImfR,
+				OrthViewImfC
+			> &Q,
+			Vector<
+				D,
+				structures::General,
+				Dense,
+				VecViewType,
+				VecImfR,
+				VecImfC
+			> &d,
 			const Ring & ring = Ring(),
 			const Minus & minus = Minus(),
-			const Divide & divide = Divide() ) {
+			const Divide & divide = Divide()
+		) {
+			(void)ring;
+			(void)minus;
+			(void)divide;
+
+			const Scalar< D > zero( ring.template getZero< D >() );
+			const Scalar< D > one( ring.template getOne< D >() );
 
 			RC rc = SUCCESS;
 
-// 			const Scalar< D > zero( ring.template getZero< D >() );
-// 			const Scalar< D > one( ring.template getOne< D >() );
-// 			const size_t n = nrows( H );
-
-// 			// Q = identity( n )
-// 			rc = alp::set( Q, zero );
-// 			auto Qdiag = alp::get_view< alp::view::diagonal >( Q );
-// 			rc = rc ? rc : alp::set( Qdiag, one );
-// 			if( rc != SUCCESS ) {
-// 				std::cerr << " set( Q, I ) failed\n";
-// 				return rc;
-// 			}
-
-// 			// Out of place specification of the computation
-// 			Matrix< D, SymmOrHermType, Dense > RR( n );
-
-// 			rc = set( RR, H );
-// 			if( rc != SUCCESS ) {
-// 				std::cerr << " set( RR, H ) failed\n";
-// 				return rc;
-// 			}
-// #ifdef DEBUG
-// 			print_matrix( " << RR >> ", RR );
-// #endif
-
-// 			// a temporary for storing the mxm result
-// 			Matrix< D, OrthogonalType, Dense > Qtmp( n, n );
-
-// 			for( size_t k = 0; k < n - 2; ++k ) {
-// #ifdef DEBUG
-// 				std::string matname(" << RR(");
-// 				matname = matname + std::to_string(k);
-// 				matname = matname + std::string( ") >> ");
-// 				print_matrix( matname , RR );
-// #endif
-
-// 				const size_t m = n - k - 1;
-
-// 				// ===== Begin Computing v =====
-// 				// v = H[ k + 1 : , k ]
-// 				// alpha = norm( v ) * v[ 0 ] / norm( v[ 0 ] )
-// 				// v = v - alpha * e1
-// 				// v = v / norm ( v )
-
-// 				auto v_view = get_view( RR, k, utils::range( k + 1, n ) );
-// 				Vector< D, structures::General, Dense > v( n - ( k + 1 ) );
-// 				rc = set( v, v_view );
-// 				if( rc != SUCCESS ) {
-// 					std::cerr << " set( v, view ) failed\n";
-// 					return rc;
-// 				}
-
-// 				Scalar< D > alpha( zero );
-// 				rc = norm2( alpha, v, ring );
-// 				if( rc != SUCCESS ) {
-// 					std::cerr << " norm2( alpha, v, ring ) failed\n";
-// 					return rc;
-// 				}
-
-// 				rc = eWiseLambda(
-// 					[ &alpha, &ring, &divide, &minus ]( const size_t i, D &val ) {
-// 						if ( i == 0 ) {
-// 							Scalar< D > norm_v0( std::abs( val ) );
-// 							Scalar< D > val_scalar( val );
-// 							foldl( alpha, val_scalar, ring.getMultiplicativeOperator() );
-// 							foldl( alpha, norm_v0, divide );
-// 							foldl( val_scalar, alpha, minus );
-// 							val = *val_scalar;
-// 						}
-// 					},
-// 					v
-// 				);
-// 				if( rc != SUCCESS ) {
-// 					std::cerr << " eWiseLambda( lambda, v ) failed\n";
-// 					return rc;
-// 				}
-
-// 				Scalar< D > norm_v( zero );
-// 				rc = norm2( norm_v, v, ring );
-// 				if( rc != SUCCESS ) {
-// 					std::cerr << " norm2( norm_v, v, ring ) failed\n";
-// 					return rc;
-// 				}
-
-// 				rc = foldl(v, norm_v, divide );
-// #ifdef DEBUG
-// 				print_vector( " v = ", v );
-// #endif
-// 				// ===== End Computing v =====
-
-// 				// ===== Calculate reflector Qk =====
-// 				// Q_k = identity( n )
-// 				Matrix< D, SymmOrHermType, Dense > Qk( n );
-// 				rc = alp::set( Qk, zero );
-// 				auto Qk_diag = alp::get_view< alp::view::diagonal >( Qk );
-// 				rc = rc ? rc : alp::set( Qk_diag, one );
-
-// 				// this part can be rewriten without temp matrix using functors
-// 				Matrix< D, SymmOrHermType, Dense > vvt( m );
-
-// 				rc = rc ? rc : set( vvt, outer( v, ring.getMultiplicativeOperator() ) );
-// 				// vvt = 2 * vvt
-// 				rc = rc ? rc : foldr( Scalar< D >( 2 ), vvt, ring.getMultiplicativeOperator() );
-
-
-// #ifdef DEBUG
-// 				print_matrix( " vvt ", vvt );
-// #endif
-
-// 				// Qk = Qk - vvt ( expanded: I - 2 * vvt )
-// 				auto Qk_view = get_view< SymmOrHermType >( Qk, utils::range( k + 1, n ), utils::range( k + 1, n ) );
-// 				if ( grb::utils::is_complex< D >::value ) {
-// 					rc = rc ? rc : foldl( Qk_view, alp::get_view< alp::view::transpose >( vvt ), minus );
-// 				} else {
-// 					rc = rc ? rc : foldl( Qk_view, vvt, minus );
-// 				}
-
-// #ifdef DEBUG
-// 				print_matrix( " << Qk >> ", Qk );
-// #endif
-// 				// ===== End of Calculate reflector Qk ====
-
-// 				// ===== Update R =====
-// 				// Rk = Qk * Rk * Qk
-
-// 				// RRQk = RR * Qk
-// 				Matrix< D, structures::Square, Dense > RRQk( n );
-// 				rc = rc ? rc : set( RRQk, zero );
-// 				rc = rc ? rc : mxm( RRQk, RR, Qk, ring );
-// 				if( rc != SUCCESS ) {
-// 					std::cerr << " mxm( RRQk, RR, Qk, ring ); failed\n";
-// 					return rc;
-// 				}
-// #ifdef DEBUG
-// 				print_matrix( " << RR x Qk = >> ", RRQk );
-// #endif
-// 				// RR = Qk * RRQk
-// 				rc = rc ? rc : set( RR, zero );
-// 				rc = rc ? rc : mxm( RR, Qk, RRQk, ring );
-
-// #ifdef DEBUG
-// 				print_matrix( " << RR( updated ) >> ", RR );
-// #endif
-// 				// ===== End of Update R =====
-
-// 				// ===== Update Q =====
-// 				// Q = Q * Qk
-
-// 				// Qtmp = Q * Qk
-// 				rc = rc ? rc : set( Qtmp, zero );
-// 				rc = rc ? rc : mxm( Qtmp, Q, Qk, ring );
-
-// 				// Q = Qtmp
-// 				rc = rc ? rc : set( Q, Qtmp );
-// #ifdef DEBUG
-// 				print_matrix( " << Q updated >> ", Q );
-// #endif
-// 				// ===== End of Update Q =====
-// 			}
-
-// 			// T = RR
-
-// 			rc = rc ? rc : set( T, get_view< SymmOrHermTridiagonalType > ( RR ) );
+			const size_t n = nrows( T );
+			const size_t m = n / 2;
+
+			if( n == 1 ) {
+				//d=T[0];
+				rc = rc ? rc : eWiseLambda(
+					[ &d ]( const size_t i, const size_t j, D &val ) {
+						(void) i;
+						(void) j;
+						alp::set( d, Scalar< D > ( val ) );
+					},
+					T
+				);
+				// Q=array([[1]]);
+				rc = rc ? rc : alp::set( Q, one );
+
+				return rc;
+			}
+
+
+			Vector< D, structures::General, Dense > v( n );
+			rc = rc ? rc : set( v, zero );
+			rc = rc ? rc : eWiseLambda(
+				[ &T, &m, &ring ]( const size_t i, D &val ) {
+					if( i ==  m - 1 ) {
+						val = ring.template getOne< D >();
+					}
+					if( i ==  m) {
+						val = internal::access( T, internal::getStorageIndex( T, m - 1, m ) );
+					}
+				},
+				v
+			);
+#ifdef DEBUG
+			print_vector( " v = ", v );
+#endif
+			Matrix< D, SymmOrHermTridiagonalType, Dense > Atmp( n );
+			rc = rc ? rc : alp::set( Atmp, T );
+			auto vvt =  alp::outer( v, ring.getMultiplicativeOperator() ) ;
+
+#ifdef DEBUG
+			print_matrix( " Atmp(0) = ", Atmp );
+			print_matrix( " vvt = ", vvt );
+#endif
+			rc = rc ? rc : alp::foldl( Atmp, vvt, minus );
+
+#ifdef DEBUG
+			print_matrix( " Atmp(1) = ", Atmp );
+#endif
+
+			auto Ttop = get_view< SymmOrHermTridiagonalType >( Atmp, utils::range( 0, m ), utils::range( 0, m ) );
+			auto Tdown = get_view< SymmOrHermTridiagonalType >( Atmp, utils::range( m, n ), utils::range( m, n ) );
+
+#ifdef DEBUG
+			print_matrix( " Ttop = ", Ttop );
+			print_matrix( " Tdown = ", Tdown );
+#endif
+
+			Vector< D, structures::General, Dense > dtmp( n );
+			rc = rc ? rc : alp::set( dtmp, zero );
+			auto dtop = get_view( dtmp, utils::range( 0, m ) );
+			auto ddown = get_view( dtmp, utils::range( m, n ) );
+
+#ifdef DEBUG
+			print_vector( " dtop = ", dtop );
+			print_vector( " ddown = ", ddown );
+#endif
+
+			Matrix< D, OrthogonalType, Dense > U( n );
+			rc = rc ? rc : alp::set( U, zero );
+#ifdef DEBUG
+			print_matrix( " U = ", U );
+#endif
+			auto Utop = get_view< OrthogonalType >( U, utils::range( 0, m ), utils::range( 0, m ) );
+
+#ifdef DEBUG
+			print_matrix( " Utop = ", Utop );
+#endif
+			auto Udown = get_view< OrthogonalType >( U, utils::range( m, n ), utils::range( m, n ) );
+
+#ifdef DEBUG
+			print_matrix( " Udown = ", Udown );
+#endif
+
+			rc = rc ? rc : symm_tridiag_dac_eigensolver( Ttop, Utop, dtop, ring );
+			rc = rc ? rc : symm_tridiag_dac_eigensolver( Tdown, Udown, ddown, ring );
+
+#ifdef DEBUG
+			std::cout << " after symm_tridiag_dac_eigensolver call:\n";
+			print_matrix( " Utop = ", Utop );
+			print_matrix( " Udown = ", Udown );
+			print_matrix( " U = ", U );
+#endif
+
+			Vector< D, structures::General, Dense > z( n );
+			rc = rc ? rc : alp::set( z, zero );
+
+#ifdef DEBUG
+			print_vector( "  v  ", v );
+			print_vector( "  z  ", z );
+#endif
+
+#ifdef TEMPDISABLE
+			// while mxv does not support vectors/view
+			// we cast vector->matrix and use mxm
+			auto z_mat_view = get_view< view::matrix >( z );
+			auto v_mat_view = get_view< view::matrix >( v );
+			rc = rc ? rc : mxm(
+				z_mat_view,
+				alp::get_view< alp::view::transpose >( U ),
+				v_mat_view,
+				ring
+			);
+#else
+			//z=U^T.dot(v)
+			rc = rc ? rc : mxv(
+				z,
+				alp::get_view< alp::view::transpose >( U ),
+				v,
+				ring
+			);
+#endif
+
+#ifdef DEBUG
+			print_vector( "  z  ", z );
+#endif
+
+			// permutations which sort dtmp
+			std::vector< size_t > isort_dtmp( n, 0 );
+			for( size_t i = 0 ; i < n ; ++i ) {
+				isort_dtmp[ i ] = i;
+			}
+			std::sort(
+				isort_dtmp.begin(),
+				isort_dtmp.end(),
+				[ &dtmp ]( const size_t &a, const size_t &b ) {
+					return ( dtmp[ a ] < dtmp[ b ] );
+				}
+			);
+#ifdef DEBUG
+			print_vector( "  dtmp  ", dtmp );
+			std::cout << " sort(dtmp) = \n";
+			std::cout << "    [ ";
+			for( size_t i = 0 ; i < n ; ++i ) {
+				std::cout << "\t" << dtmp[ isort_dtmp[ i ] ];
+			}
+			std::cout << " ]\n";
+#endif
+
+			// temp solution:
+			// dtmp2 and ztmp2 in the final version should be
+			// permutations views of dtmp and z, respectively
+			// instead, here we materialize permutations
+			Vector< D, structures::General, Dense > dtmp2( n );
+			Vector< D, structures::General, Dense > ztmp2( n );
+			rc = rc ? rc : alp::set( dtmp2, zero );
+			rc = rc ? rc : alp::set( ztmp2, zero );
+			for( size_t i = 0 ; i < n ; ++i ) {
+				dtmp2[ i ] = dtmp[ isort_dtmp[ i ] ];
+				ztmp2[ i ] = z[ isort_dtmp[ i ] ];
+			}
+#ifdef DEBUG
+			print_vector( "  dtmp2  ", dtmp2 );
+			print_vector( "  ztmp2  ", ztmp2 );
+#endif
+
+
+#ifdef TEMPDISABLE
+			// *********** diagDpOuter not implemented ***********
+			//nummerical wrong, missing diagDpOuter implementation
+			rc = rc ? rc : alp::set( d, dtmp2 );
+			//nummerical wrong, missing diagDpOuter implementation
+			Matrix< D, OrthogonalType, Dense > QdOuter( n );
+			rc = rc ? rc : alp::set( QdOuter, zero );
+			auto QdOuter_diag = alp::get_view< alp::view::diagonal >( QdOuter );
+			rc = rc ? rc : alp::set( QdOuter_diag, one );
+			// ***************************************************
+#else
+			D,V= diagDpOuter( dtmp2, ztmp2 );
+#endif
+
+#ifdef DEBUG
+			print_matrix( "  QdOuter  ", QdOuter );
+#endif
+
+			// temp
+			// unpermute cols into QdOuterUnpermuted
+			Matrix< D, OrthogonalType, Dense > QdOuterUnpermuted( n );
+			rc = rc ? rc : alp::set( QdOuterUnpermuted, zero );
+			for( size_t i = 0 ; i < n ; ++i ) {
+				auto vin = get_view( QdOuter, utils::range( 0, n ), i );
+				auto vout = get_view( QdOuterUnpermuted, utils::range( 0, n ), isort_dtmp[ i ] );
+				rc = rc ? rc : alp::set( vout, vin );
+			}
+
+#ifdef DEBUG
+			print_matrix( "  QdOuterUnpermuted  ", QdOuterUnpermuted );
+#endif
+
+			// Q=U.dot((V[:,iiinv]).T)
+			rc = rc ? rc : alp::set( Q, zero );
+			rc = rc ? rc : mxm(
+				Q,
+				U,
+				alp::get_view< alp::view::transpose >( QdOuterUnpermuted ),
+				ring
+			);
+
 			return rc;
 		}
 	} // namespace algorithms
diff --git a/include/alp/storage.hpp b/include/alp/storage.hpp
index c957d971b..8d5adaef3 100644
--- a/include/alp/storage.hpp
+++ b/include/alp/storage.hpp
@@ -175,7 +175,7 @@ namespace alp {
 				typedef BivariateQuadratic< 1, 0, 0, 1, 2, 0, 2 > poly_type;
 
 				static poly_type Create( const size_t rows, const size_t cols ) {
-#ifndef DEBUG
+#ifdef NDEBUG
 					(void) cols;
 					(void) rows;
 #endif
@@ -184,7 +184,7 @@ namespace alp {
 				}
 
 				static size_t GetStorageDimensions( const size_t rows, const size_t cols ) {
-#ifndef DEBUG
+#ifdef NDEBUG
 					(void) cols;
 #endif
 					assert( rows == cols );
@@ -199,7 +199,7 @@ namespace alp {
 				typedef BivariateQuadratic< 0, 1, 0, 2, 1, 0, 2 > poly_type;
 
 				static poly_type Create( const size_t rows, const size_t cols ) {
-#ifndef DEBUG
+#ifdef NDEBUG
 					(void) cols;
 					(void) rows;
 #endif
@@ -208,7 +208,7 @@ namespace alp {
 				}
 
 				static size_t GetStorageDimensions( const size_t rows, const size_t cols ) {
-#ifndef DEBUG
+#ifdef NDEBUG
 					(void) cols;
 #endif
 					assert( rows == cols );
@@ -223,7 +223,7 @@ namespace alp {
 				typedef BivariateQuadratic< 1, 0, 0, 1, 2, 0, 2 > poly_type;
 
 				static poly_type Create( const size_t rows, const size_t cols ) {
-#ifndef DEBUG
+#ifdef NDEBUG
 					(void) cols;
 					(void) rows;
 #endif
@@ -232,7 +232,7 @@ namespace alp {
 				}
 
 				static size_t GetStorageDimensions( const size_t rows, const size_t cols ) {
-#ifndef DEBUG
+#ifdef NDEBUG
 					(void) cols;
 #endif
 					assert( rows == cols );
@@ -247,7 +247,7 @@ namespace alp {
 				typedef BivariateQuadratic< 0, 1, 0, 2, 1, 0, 2 > poly_type;
 
 				static poly_type Create( const size_t rows, const size_t cols ) {
-#ifndef DEBUG
+#ifdef NDEBUG
 					(void) rows;
 					(void) cols;
 #endif
@@ -256,7 +256,7 @@ namespace alp {
 				}
 
 				static size_t GetStorageDimensions( const size_t rows, const size_t cols ) {
-#ifndef DEBUG
+#ifdef NDEBUG
 					(void) cols;
 #endif
 					assert( rows == cols );
diff --git a/include/alp/structures.hpp b/include/alp/structures.hpp
index 03647dbd3..950f6204b 100644
--- a/include/alp/structures.hpp
+++ b/include/alp/structures.hpp
@@ -544,6 +544,14 @@ namespace alp {
 				>::type;
 		};
 
+		template<>
+		struct isInstantiable< SymmetricTridiagonal, SymmetricTridiagonal > {
+			template< typename ImfR, typename ImfC >
+			static bool check( const ImfR &imf_r, const ImfC &imf_c ) {
+				return imf_r.isSame(imf_c);
+			};
+		};
+
 		struct HermitianTridiagonal: BaseStructure {
 
 			private:
@@ -621,6 +629,14 @@ namespace alp {
 			using inferred_structures = tuple_cat< std::tuple< Orthogonal >, NonSingular::inferred_structures, OrthogonalColumns::inferred_structures, OrthogonalRows::inferred_structures >::type;
 		};
 
+		template<>
+		struct isInstantiable< Orthogonal, Orthogonal > {
+			template< typename ImfR, typename ImfC >
+			static bool check( const ImfR &imf_r, const ImfC &imf_c ) {
+				return imf_r.isSame(imf_c);
+			};
+		};
+
 		struct Constant: BaseStructure {
 
 			typedef std::tuple< OpenInterval > band_intervals;
diff --git a/tests/smoke/alp_stedc.cpp b/tests/smoke/alp_stedc.cpp
index 742893d76..e873ed7b7 100644
--- a/tests/smoke/alp_stedc.cpp
+++ b/tests/smoke/alp_stedc.cpp
@@ -47,13 +47,17 @@ using Orthogonal = structures::Orthogonal;
 // using HermitianOrSymmetric = structures::Hermitian;
 // #else
 using ScalarType = BaseScalarType;
+
+//temp
 using HermitianOrSymmetricTridiagonal = structures::SymmetricTridiagonal;
+//using HermitianOrSymmetricTridiagonal = structures::Square;
+
 //fully implemented structures
 using HermitianOrSymmetric = structures::Symmetric;
 // #endif
 
 constexpr BaseScalarType tol = 1.e-10;
-constexpr size_t RNDSEED = 1;
+constexpr size_t RNDSEED = 11235;
 
 //temp function untill Hermitian containter is implemented
 //** gnerate symmetric-hermitian matrix in a square container */
@@ -260,14 +264,15 @@ void alp_program( const size_t & unit, alp::RC & rc ) {
 		alp::identities::zero,
 		alp::identities::one
 	> ring;
+	const Scalar< ScalarType > zero_scalar( ring.template getZero< ScalarType >() );
 
 	// dimensions of sqare matrices H, Q and R
 	size_t N = unit;
 
 	alp::Matrix< ScalarType, Orthogonal > Q( N );
 	alp::Matrix< ScalarType, HermitianOrSymmetricTridiagonal > T( N );
-	// Vector< ScalarType, structures::General, Dense > d( N );
 	Vector< ScalarType, structures::General, Dense > d( N );
+	rc = rc ? rc : set( d, zero_scalar );
 	{
 		auto matrix_data = generate_symmherm_tridiag_matrix_data< ScalarType >( N );
 		rc = rc ? rc : alp::buildMatrix( T, matrix_data.begin(), matrix_data.end() );
@@ -276,13 +281,18 @@ void alp_program( const size_t & unit, alp::RC & rc ) {
 	print_matrix( " input matrix T ", T );
 #endif
 
-  	rc = rc ? rc : algorithms::symm_tridiag_eigensolver( T, Q, d );
+  	rc = rc ? rc : algorithms::symm_tridiag_dac_eigensolver(
+		T,
+		Q,
+		d,
+		ring
+	);
 
 
-// #ifdef DEBUG
-// 	print_matrix( " << Q >> ", Q );
-// 	print_matrix( " << T >> ", T );
-// #endif
+#ifdef DEBUG
+	print_matrix( " << Q >> ", Q );
+	print_matrix( " << T >> ", T );
+#endif
 
 // 	rc = check_overlap( Q );
 // 	if( rc != SUCCESS ) {

From e32ed384ffc1452f8125971fc06211f905e9d31a Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Fri, 14 Oct 2022 09:52:28 +0200
Subject: [PATCH 03/14] eigensolveDiagPlusOuter

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 116 ++++++++++++++++--
 1 file changed, 109 insertions(+), 7 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index 1a341d869..c783175a8 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -28,6 +28,103 @@ namespace alp {
 
 	namespace algorithms {
 
+		/**
+		 * Calcualte eigendecomposition of system D + vvt
+		 *        \f$D = diag(d)$ is diagonal matrix and
+		 *        \a vvt outer product outer(v,v)
+		 *
+		 * @tparam D        Data element type
+		 * @tparam Ring     Type of the semiring used in the computation
+		 * @tparam Minus    Type minus operator used in the computation
+		 * @tparam Divide   Type of divide operator used in the computation
+		 * @param[out] Egvecs    output orthogonal matrix contaning eigenvectors
+		 * @param[out] egvals    output vector containg eigenvalues
+		 * @param[in]  ring A semiring for operations
+		 * @return RC       SUCCESS if the execution was correct
+		 *
+		 */
+		template<
+			typename D,
+			typename VecView1,
+			typename VecImfR1,
+			typename VecImfC1,
+			typename VecView2,
+			typename VecImfR2,
+			typename VecImfC2,
+			typename VecView3,
+			typename VecImfR3,
+			typename VecImfC3,
+			typename OrthogonalType,
+			typename OrthViewType,
+			typename OrthViewImfR,
+			typename OrthViewImfC,
+			class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >,
+			class Minus = operators::subtract< D >,
+			class Divide = operators::divide< D >
+		>
+		RC eigensolveDiagPlusOuter(
+			Vector<	D, structures::General,	Dense, VecView1, VecImfR1, VecImfC1 > &egvals,
+			Matrix< D, OrthogonalType, Dense, OrthViewType, OrthViewImfR, OrthViewImfC > &Egvecs,
+			Vector<	D, structures::General, Dense, VecView2, VecImfR2, VecImfC2 > &d,
+			Vector< D, structures::General, Dense, VecView3, VecImfR3, VecImfC3 > &v,
+			const Ring & ring = Ring(),
+			const Minus & minus = Minus(),
+			const Divide & divide = Divide()
+		) {
+			RC rc = SUCCESS;
+
+			const size_t n = nrows( Egvecs );
+
+			const double eps = 1.e-7;
+			// if(min(abs(v))<eps):
+			//     ii=where(abs(v)<eps)[0]
+			//     for i in ii:
+			//         egvs[i]=d[i]
+			//         dvec=zeros(len(d))
+			//         dvec[i]=1
+			//         egvecs[i]=dvec
+			//     d=d[~(abs(v0)<eps)]
+			//     v=v[~(abs(v0)<eps)]
+			for( size_t i = 0; i < n; i++ ) {
+//				if( std::abs( v[ i ] ) < eps ) {
+					//simple egval formula ;
+					//set eigenvalue
+					egvals[ i ] = d[ i ];
+					//set eigenvector
+					//(could be done without temp vector by using eWiseLambda)
+					Vector< D, structures::General, Dense > dvec( n );
+					alp::set( dvec, Scalar< D > ( ring.template getZero< D >() ) );
+					dvec[ i ] = ring.template getOne< D >();
+					auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, n ), i );
+					rc = rc ? rc : alp::set( Egvecs_vec_view, dvec );
+//				} else {
+//					//complicated egval formula ;
+//				}
+			}
+
+
+			// for i in range(len(d)):
+			//     egval,lambdax,dvec = zerodandc(d,v,i)
+			//     dlam=dlam+[lambdax]
+			//     #egvecs=egvecs+[dvec]
+			//     dvec=v/dvec
+			//     dvec=dvec/norm(dvec)
+			//     egvecs_tmp=egvecs_tmp+[dvec]
+			//     egvs_tmp=egvs_tmp+[egval]
+			// egvecs_tmp=array(egvecs_tmp)
+			// egvs_tmp=array(egvs_tmp)
+
+			// egvecs_tmp=array(egvecs_tmp)
+			// egvs_tmp=array(egvs_tmp)
+			// egvs[~(abs(v0)<eps)]=egvs_tmp
+			// for j,i in enumerate(where(~(abs(v0)<eps))[0]):
+			//     egvecs[i,~(abs(v0)<eps)]=egvecs_tmp[j]
+
+
+			return rc;
+		}
+
+
 		/**
 		 * Calcualte eigendecomposition of symmetric tridiagonal matrix T
 		 *        \f$T = Qdiag(d)Q^T\f$ where
@@ -269,15 +366,20 @@ namespace alp {
 
 
 #ifdef TEMPDISABLE
-			// *********** diagDpOuter not implemented ***********
-			//nummerical wrong, missing diagDpOuter implementation
-			rc = rc ? rc : alp::set( d, dtmp2 );
-			//nummerical wrong, missing diagDpOuter implementation
+			// // *********** diagDpOuter not implemented ***********
+			// //nummerical wrong, missing diagDpOuter implementation
+			// rc = rc ? rc : alp::set( d, dtmp2 );
+			// //nummerical wrong, missing diagDpOuter implementation
+			// Matrix< D, OrthogonalType, Dense > QdOuter( n );
+			// rc = rc ? rc : alp::set( QdOuter, zero );
+			// auto QdOuter_diag = alp::get_view< alp::view::diagonal >( QdOuter );
+			// rc = rc ? rc : alp::set( QdOuter_diag, one );
+			// // ***************************************************
+
+			rc = rc ? rc : alp::set( d, zero );
 			Matrix< D, OrthogonalType, Dense > QdOuter( n );
 			rc = rc ? rc : alp::set( QdOuter, zero );
-			auto QdOuter_diag = alp::get_view< alp::view::diagonal >( QdOuter );
-			rc = rc ? rc : alp::set( QdOuter_diag, one );
-			// ***************************************************
+			rc = rc ? rc : eigensolveDiagPlusOuter( d, QdOuter, dtmp2, ztmp2 );
 #else
 			D,V= diagDpOuter( dtmp2, ztmp2 );
 #endif

From 1f185ee1d7aaf797a73efa03ee7cf0488dd442be Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Tue, 18 Oct 2022 14:33:36 +0200
Subject: [PATCH 04/14] find zeroes of secular polynomial using bisections

function name: bisec_sec_eq

this is not an optimal solution and it might be relaced later
---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 237 +++++++++++++-----
 1 file changed, 176 insertions(+), 61 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index c783175a8..caa0f5601 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -28,6 +28,86 @@ namespace alp {
 
 	namespace algorithms {
 
+		/**
+		 * find zero of secular equation in interval <a,b>
+		 * using bisection
+		 * this is not an optimal algorithm and there are many
+		 * more efficient implantation
+		 */
+		template<
+			typename D,
+			typename VecView1,
+			typename VecImfR1,
+			typename VecImfC1,
+			typename VecView2,
+			typename VecImfR2,
+			typename VecImfC2,
+			class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >,
+			class Minus = operators::subtract< D >,
+			class Divide = operators::divide< D >
+		>
+		RC bisec_sec_eq(
+			Scalar< D > &lambda,
+			const Vector<	D, structures::General,	Dense, VecView1, VecImfR1, VecImfC1 > &d,
+			// Vector v should be const, but that would disable eWiseLambda, to be resolved in the future
+			Vector<	D, structures::General,	Dense, VecView2, VecImfR2, VecImfC2 > &v,
+			const Scalar< D > &a,
+			const Scalar< D > &b,
+			const D tol=1.e-12,
+			const Ring & ring = Ring(),
+			const Minus & minus = Minus(),
+			const Divide & divide = Divide()
+		) {
+			RC rc = SUCCESS;
+
+#ifdef DEBUG
+			std::cout << " a = " << *a << " ";
+			std::cout << " b = " << *b << " ";
+#endif
+
+			const Scalar< D > zero( ring.template getZero< D >() );
+			const Scalar< D > one( ring.template getOne< D >() );
+			Scalar< D > x0( ( *a + *b ) / ( 2 ) );
+
+			if( std::abs( *a - *b ) < tol ) {
+				alp::set( lambda, x0 );
+				return rc;
+			}
+
+			//fx0=1+sum(v**2/(d-x0))
+			Scalar< D > fx0( one );
+			rc = rc ? rc : eWiseLambda(
+				[ &d, &x0, &fx0, &ring, &minus, &divide ]( const size_t i, D &val ) {
+					Scalar< D > alpha( val );
+					Scalar< D > beta( d[ i ] );
+					foldl( alpha, Scalar< D > ( val ), ring.getMultiplicativeOperator() );
+					foldl( beta, x0, minus );
+					foldl( alpha, beta, divide );
+					foldl( fx0, alpha, ring.getAdditiveOperator() );
+				},
+				v
+			);
+
+#ifdef DEBUG
+			std::cout << " x0 = " << *x0 << " ";
+			std::cout << " fx0 = " << *fx0 << "\n";
+#endif
+
+			if( std::abs( *fx0 ) < tol ) {
+				alp::set( lambda, x0 );
+				return rc;
+			}
+
+			if( *fx0 < *zero ) {
+				rc = rc ? rc : bisec_sec_eq( lambda, d, v, x0, b, tol );
+			} else {
+				rc = rc ? rc : bisec_sec_eq( lambda, d, v, a, x0, tol );
+			}
+
+			return rc;
+		}
+
+
 		/**
 		 * Calcualte eigendecomposition of system D + vvt
 		 *        \f$D = diag(d)$ is diagonal matrix and
@@ -73,53 +153,117 @@ namespace alp {
 		) {
 			RC rc = SUCCESS;
 
+			const Scalar< D > zero( ring.template getZero< D >() );
+			const Scalar< D > one( ring.template getOne< D >() );
 			const size_t n = nrows( Egvecs );
-
 			const double eps = 1.e-7;
-			// if(min(abs(v))<eps):
-			//     ii=where(abs(v)<eps)[0]
-			//     for i in ii:
-			//         egvs[i]=d[i]
-			//         dvec=zeros(len(d))
-			//         dvec[i]=1
-			//         egvecs[i]=dvec
-			//     d=d[~(abs(v0)<eps)]
-			//     v=v[~(abs(v0)<eps)]
+
+			size_t non_trivial_egvc_count = 0;
+			Vector< D, structures::General, Dense > d_nontrv( n );
+			Vector< D, structures::General, Dense > v_nontrv( n );
+			alp::set( d_nontrv, zero );
+			alp::set( v_nontrv, zero );
+
 			for( size_t i = 0; i < n; i++ ) {
-//				if( std::abs( v[ i ] ) < eps ) {
+				if( std::abs( v[ i ] ) < eps ) {
 					//simple egval formula ;
 					//set eigenvalue
 					egvals[ i ] = d[ i ];
 					//set eigenvector
 					//(could be done without temp vector by using eWiseLambda)
 					Vector< D, structures::General, Dense > dvec( n );
-					alp::set( dvec, Scalar< D > ( ring.template getZero< D >() ) );
-					dvec[ i ] = ring.template getOne< D >();
+					alp::set( dvec, zero );
+					dvec[ i ] = *one;
 					auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, n ), i );
 					rc = rc ? rc : alp::set( Egvecs_vec_view, dvec );
-//				} else {
-//					//complicated egval formula ;
-//				}
+				} else {
+					//complicated egval formula ;
+					d_nontrv[ non_trivial_egvc_count ] = d[ i ];
+					v_nontrv[ non_trivial_egvc_count ] = v[ i ];
+					++non_trivial_egvc_count;
+				}
 			}
 
+			auto d_nontrv_nnz_view = get_view( d_nontrv, utils::range( 0, non_trivial_egvc_count ) );
+			auto v_nontrv_nnz_view = get_view( v_nontrv, utils::range( 0, non_trivial_egvc_count ) );
+
+			Vector< D, structures::General, Dense > egvals_nontrv( non_trivial_egvc_count );
+			Matrix< D, OrthogonalType, Dense > Egvecs_nontrv( non_trivial_egvc_count );
+			rc = rc ? rc : alp::set( egvals_nontrv, zero );
+			rc = rc ? rc : alp::set( Egvecs_nontrv, zero );
 
-			// for i in range(len(d)):
-			//     egval,lambdax,dvec = zerodandc(d,v,i)
-			//     dlam=dlam+[lambdax]
-			//     #egvecs=egvecs+[dvec]
-			//     dvec=v/dvec
-			//     dvec=dvec/norm(dvec)
-			//     egvecs_tmp=egvecs_tmp+[dvec]
-			//     egvs_tmp=egvs_tmp+[egval]
-			// egvecs_tmp=array(egvecs_tmp)
-			// egvs_tmp=array(egvs_tmp)
+#ifdef DEBUG
+			print_vector( "eigensolveDiagPlusOuter: d ", d );
+			print_vector( "eigensolveDiagPlusOuter: v ", v );
+			print_vector( "eigensolveDiagPlusOuter: d_nontrv_nnz_view ", d_nontrv_nnz_view );
+			print_vector( "eigensolveDiagPlusOuter: v_nontrv_nnz_view ", v_nontrv_nnz_view );
+
+			for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
+				std::cout << " ============ i= " << i << "  ============\n";
 
-			// egvecs_tmp=array(egvecs_tmp)
-			// egvs_tmp=array(egvs_tmp)
-			// egvs[~(abs(v0)<eps)]=egvs_tmp
-			// for j,i in enumerate(where(~(abs(v0)<eps))[0]):
-			//     egvecs[i,~(abs(v0)<eps)]=egvecs_tmp[j]
+				std::cout << " d = array([";
+				for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
+					std::cout << d_nontrv_nnz_view[ i ] << ", ";
+				}
+				std::cout << " ])\n";
+				std::cout << " v = array([";
+				for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
+					std::cout << v_nontrv_nnz_view[ i ] << ", ";
+				}
+				std::cout << " ])\n";
+
+				Scalar< D > a( d_nontrv_nnz_view[ i ] );
+				Scalar< D > b( d_nontrv_nnz_view[ i ] );
+				std::cout << "0 a,b=" << *a << " " << *b << "\n";
+				if( i + 1 < non_trivial_egvc_count  ) {
+					std::cout << " alp::set b to <<" << d_nontrv_nnz_view[ i + 1 ] << ">> \n";
+					rc = alp::set( b, Scalar< D >( d_nontrv_nnz_view[ i + 1 ] ) );
+					if( rc != SUCCESS ) {
+						std::cout << " **** alp::set failed ***** \n";
+					}
+					std::cout << "1  a,b=" << *a << " " << *b << "\n";
+				} else {
+					Scalar< D > alpha( zero );
+					rc = rc ? rc : norm2( alpha, v, ring );
+					foldl( b, alpha, ring.getAdditiveOperator() );
+					std::cout << "2 a,b=" << *a << " " << *b << "\n";
+				}
+				Scalar< D > lambda( ( *a - *b ) / 2 );
 
+				std::cout << " a,lambda,b=" << *a << " " << *lambda << " " << *b << "\n";
+
+				rc = rc ? rc : bisec_sec_eq( lambda, d_nontrv_nnz_view, v_nontrv_nnz_view, a, b );
+				std::cout << " lambda (" << i << ") = " << *lambda << "\n";
+			}
+#endif
+
+
+#ifdef TEMPDISABLE
+			for( size_t i = 0; i < non_trivial_egvc_count; i++ ) {
+				egvals_nontrv[ i ] = d_nontrv[ i ];
+				Vector< D, structures::General, Dense > dvec( non_trivial_egvc_count );
+				alp::set( dvec, zero );
+				dvec[ i ] = *one;
+				auto Egvecs_nontrv_vec_view = get_view( Egvecs_nontrv, utils::range( 0, non_trivial_egvc_count ), i );
+				rc = rc ? rc : alp::set( Egvecs_nontrv_vec_view, dvec );
+			}
+#else
+			not implemented;
+#endif
+
+			//copy egvals_nontrv and Egvecs_nontrv into egvals and Egvecs
+			size_t k = 0;
+			for( size_t i = 0; i < n; i++ ) {
+				if( !( std::abs( v[ i ] ) < eps ) ) {
+					egvals[ i ] = egvals_nontrv[ k ];
+					//resolve this with select/permute view
+#ifdef TEMPDISABLE
+					auto Egvecs_nontrv_vec_view = get_view( Egvecs_nontrv, utils::range( 0, non_trivial_egvc_count ), k );
+					auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, non_trivial_egvc_count ), i ); // this is wrong
+					rc = rc ? rc : alp::set( Egvecs_vec_view, Egvecs_nontrv_vec_view );
+#endif
+				}
+			}
 
 			return rc;
 		}
@@ -261,27 +405,12 @@ namespace alp {
 			auto dtop = get_view( dtmp, utils::range( 0, m ) );
 			auto ddown = get_view( dtmp, utils::range( m, n ) );
 
-#ifdef DEBUG
-			print_vector( " dtop = ", dtop );
-			print_vector( " ddown = ", ddown );
-#endif
-
 			Matrix< D, OrthogonalType, Dense > U( n );
 			rc = rc ? rc : alp::set( U, zero );
-#ifdef DEBUG
-			print_matrix( " U = ", U );
-#endif
-			auto Utop = get_view< OrthogonalType >( U, utils::range( 0, m ), utils::range( 0, m ) );
 
-#ifdef DEBUG
-			print_matrix( " Utop = ", Utop );
-#endif
+			auto Utop = get_view< OrthogonalType >( U, utils::range( 0, m ), utils::range( 0, m ) );
 			auto Udown = get_view< OrthogonalType >( U, utils::range( m, n ), utils::range( m, n ) );
 
-#ifdef DEBUG
-			print_matrix( " Udown = ", Udown );
-#endif
-
 			rc = rc ? rc : symm_tridiag_dac_eigensolver( Ttop, Utop, dtop, ring );
 			rc = rc ? rc : symm_tridiag_dac_eigensolver( Tdown, Udown, ddown, ring );
 
@@ -365,24 +494,10 @@ namespace alp {
 #endif
 
 
-#ifdef TEMPDISABLE
-			// // *********** diagDpOuter not implemented ***********
-			// //nummerical wrong, missing diagDpOuter implementation
-			// rc = rc ? rc : alp::set( d, dtmp2 );
-			// //nummerical wrong, missing diagDpOuter implementation
-			// Matrix< D, OrthogonalType, Dense > QdOuter( n );
-			// rc = rc ? rc : alp::set( QdOuter, zero );
-			// auto QdOuter_diag = alp::get_view< alp::view::diagonal >( QdOuter );
-			// rc = rc ? rc : alp::set( QdOuter_diag, one );
-			// // ***************************************************
-
 			rc = rc ? rc : alp::set( d, zero );
 			Matrix< D, OrthogonalType, Dense > QdOuter( n );
 			rc = rc ? rc : alp::set( QdOuter, zero );
 			rc = rc ? rc : eigensolveDiagPlusOuter( d, QdOuter, dtmp2, ztmp2 );
-#else
-			D,V= diagDpOuter( dtmp2, ztmp2 );
-#endif
 
 #ifdef DEBUG
 			print_matrix( "  QdOuter  ", QdOuter );

From 4b8346012a7208b2d7ddd7e31926284ee724db90 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Tue, 18 Oct 2022 15:58:23 +0200
Subject: [PATCH 05/14] tmp

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 287 ++++++++++--------
 1 file changed, 160 insertions(+), 127 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index caa0f5601..f33690422 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -158,112 +158,152 @@ namespace alp {
 			const size_t n = nrows( Egvecs );
 			const double eps = 1.e-7;
 
-			size_t non_trivial_egvc_count = 0;
-			Vector< D, structures::General, Dense > d_nontrv( n );
-			Vector< D, structures::General, Dense > v_nontrv( n );
-			alp::set( d_nontrv, zero );
-			alp::set( v_nontrv, zero );
+			// all egvec/val are trivial when the corresponding
+			// element of v is zero
+			size_t count_direct_egvc = 0;
+			size_t count_non_direct_egvc = 0;
+
+			std::vector< size_t > direct_egvc_indx( n, 0 );
+			std::vector< size_t > non_direct_egvc_indx( n, 0 );
 
 			for( size_t i = 0; i < n; i++ ) {
 				if( std::abs( v[ i ] ) < eps ) {
 					//simple egval formula ;
-					//set eigenvalue
-					egvals[ i ] = d[ i ];
-					//set eigenvector
-					//(could be done without temp vector by using eWiseLambda)
-					Vector< D, structures::General, Dense > dvec( n );
-					alp::set( dvec, zero );
-					dvec[ i ] = *one;
-					auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, n ), i );
-					rc = rc ? rc : alp::set( Egvecs_vec_view, dvec );
+					direct_egvc_indx[ count_direct_egvc ] = i ;
+					++count_direct_egvc;
 				} else {
 					//complicated egval formula ;
-					d_nontrv[ non_trivial_egvc_count ] = d[ i ];
-					v_nontrv[ non_trivial_egvc_count ] = v[ i ];
-					++non_trivial_egvc_count;
+					non_direct_egvc_indx[ count_non_direct_egvc ] = i;
+					++count_non_direct_egvc;
 				}
 			}
-
-			auto d_nontrv_nnz_view = get_view( d_nontrv, utils::range( 0, non_trivial_egvc_count ) );
-			auto v_nontrv_nnz_view = get_view( v_nontrv, utils::range( 0, non_trivial_egvc_count ) );
-
-			Vector< D, structures::General, Dense > egvals_nontrv( non_trivial_egvc_count );
-			Matrix< D, OrthogonalType, Dense > Egvecs_nontrv( non_trivial_egvc_count );
-			rc = rc ? rc : alp::set( egvals_nontrv, zero );
-			rc = rc ? rc : alp::set( Egvecs_nontrv, zero );
+			direct_egvc_indx.resize( count_direct_egvc );
+			non_direct_egvc_indx.resize( count_non_direct_egvc );
+			alp::Vector< size_t > select_direct( count_direct_egvc );
+			alp::Vector< size_t > select_non_direct( count_non_direct_egvc );
+			alp::buildVector( select_direct, direct_egvc_indx.begin(), direct_egvc_indx.end() );
+			alp::buildVector( select_non_direct, non_direct_egvc_indx.begin(), non_direct_egvc_indx.end() );
 
 #ifdef DEBUG
-			print_vector( "eigensolveDiagPlusOuter: d ", d );
-			print_vector( "eigensolveDiagPlusOuter: v ", v );
-			print_vector( "eigensolveDiagPlusOuter: d_nontrv_nnz_view ", d_nontrv_nnz_view );
-			print_vector( "eigensolveDiagPlusOuter: v_nontrv_nnz_view ", v_nontrv_nnz_view );
-
-			for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
-				std::cout << " ============ i= " << i << "  ============\n";
-
-				std::cout << " d = array([";
-				for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
-					std::cout << d_nontrv_nnz_view[ i ] << ", ";
-				}
-				std::cout << " ])\n";
-				std::cout << " v = array([";
-				for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
-					std::cout << v_nontrv_nnz_view[ i ] << ", ";
-				}
-				std::cout << " ])\n";
-
-				Scalar< D > a( d_nontrv_nnz_view[ i ] );
-				Scalar< D > b( d_nontrv_nnz_view[ i ] );
-				std::cout << "0 a,b=" << *a << " " << *b << "\n";
-				if( i + 1 < non_trivial_egvc_count  ) {
-					std::cout << " alp::set b to <<" << d_nontrv_nnz_view[ i + 1 ] << ">> \n";
-					rc = alp::set( b, Scalar< D >( d_nontrv_nnz_view[ i + 1 ] ) );
-					if( rc != SUCCESS ) {
-						std::cout << " **** alp::set failed ***** \n";
-					}
-					std::cout << "1  a,b=" << *a << " " << *b << "\n";
-				} else {
-					Scalar< D > alpha( zero );
-					rc = rc ? rc : norm2( alpha, v, ring );
-					foldl( b, alpha, ring.getAdditiveOperator() );
-					std::cout << "2 a,b=" << *a << " " << *b << "\n";
-				}
-				Scalar< D > lambda( ( *a - *b ) / 2 );
-
-				std::cout << " a,lambda,b=" << *a << " " << *lambda << " " << *b << "\n";
-
-				rc = rc ? rc : bisec_sec_eq( lambda, d_nontrv_nnz_view, v_nontrv_nnz_view, a, b );
-				std::cout << " lambda (" << i << ") = " << *lambda << "\n";
-			}
+			std::cout << " count_direct_egvc = " << count_direct_egvc << "\n";
+			std::cout << " count_non_direct_egvc = " << count_non_direct_egvc << "\n";
 #endif
+			auto egvals_direct = get_view< alp::structures::General >( egvals, select_direct );
+			auto egvals_non_direct = get_view< alp::structures::General >( egvals, select_non_direct );
 
+			auto Egvecs_direct = alp::get_view< alp::structures::Orthogonal >(
+				Egvecs, select_direct, select_direct
+			);
+			auto Egvecs_non_direct = alp::get_view< alp::structures::Orthogonal >(
+				Egvecs, select_non_direct, select_non_direct
+			);
 
-#ifdef TEMPDISABLE
-			for( size_t i = 0; i < non_trivial_egvc_count; i++ ) {
-				egvals_nontrv[ i ] = d_nontrv[ i ];
-				Vector< D, structures::General, Dense > dvec( non_trivial_egvc_count );
-				alp::set( dvec, zero );
-				dvec[ i ] = *one;
-				auto Egvecs_nontrv_vec_view = get_view( Egvecs_nontrv, utils::range( 0, non_trivial_egvc_count ), i );
-				rc = rc ? rc : alp::set( Egvecs_nontrv_vec_view, dvec );
-			}
-#else
-			not implemented;
-#endif
 
-			//copy egvals_nontrv and Egvecs_nontrv into egvals and Egvecs
-			size_t k = 0;
-			for( size_t i = 0; i < n; i++ ) {
-				if( !( std::abs( v[ i ] ) < eps ) ) {
-					egvals[ i ] = egvals_nontrv[ k ];
-					//resolve this with select/permute view
-#ifdef TEMPDISABLE
-					auto Egvecs_nontrv_vec_view = get_view( Egvecs_nontrv, utils::range( 0, non_trivial_egvc_count ), k );
-					auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, non_trivial_egvc_count ), i ); // this is wrong
-					rc = rc ? rc : alp::set( Egvecs_vec_view, Egvecs_nontrv_vec_view );
-#endif
-				}
-			}
+			// Vector< D, structures::General, Dense > d_nontrv( n );
+			// Vector< D, structures::General, Dense > v_nontrv( n );
+			// alp::set( d_nontrv, zero );
+			// alp::set( v_nontrv, zero );
+
+			// for( size_t i = 0; i < n; i++ ) {
+			// 	if( std::abs( v[ i ] ) < eps ) {
+			// 		//simple egval formula ;
+			// 		//set eigenvalue
+			// 		egvals[ i ] = d[ i ];
+			// 		//set eigenvector
+			// 		//(could be done without temp vector by using eWiseLambda)
+			// 		Vector< D, structures::General, Dense > dvec( n );
+			// 		alp::set( dvec, zero );
+			// 		dvec[ i ] = *one;
+			// 		auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, n ), i );
+			// 		rc = rc ? rc : alp::set( Egvecs_vec_view, dvec );
+			// 	} else {
+			// 		//complicated egval formula ;
+			// 		d_nontrv[ non_trivial_egvc_count ] = d[ i ];
+			// 		v_nontrv[ non_trivial_egvc_count ] = v[ i ];
+			// 		++non_trivial_egvc_count;
+			// 	}
+			// }
+
+			// auto d_nontrv_nnz_view = get_view( d_nontrv, utils::range( 0, non_trivial_egvc_count ) );
+			// auto v_nontrv_nnz_view = get_view( v_nontrv, utils::range( 0, non_trivial_egvc_count ) );
+
+			// Vector< D, structures::General, Dense > egvals_nontrv( non_trivial_egvc_count );
+			// Matrix< D, OrthogonalType, Dense > Egvecs_nontrv( non_trivial_egvc_count );
+			// rc = rc ? rc : alp::set( egvals_nontrv, zero );
+			// rc = rc ? rc : alp::set( Egvecs_nontrv, zero );
+
+// #ifdef DEBUG
+// 			print_vector( "eigensolveDiagPlusOuter: d ", d );
+// 			print_vector( "eigensolveDiagPlusOuter: v ", v );
+// 			print_vector( "eigensolveDiagPlusOuter: d_nontrv_nnz_view ", d_nontrv_nnz_view );
+// 			print_vector( "eigensolveDiagPlusOuter: v_nontrv_nnz_view ", v_nontrv_nnz_view );
+
+// 			// for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
+// 			// 	std::cout << " ============ i= " << i << "  ============\n";
+
+// 			// 	std::cout << " d = array([";
+// 			// 	for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
+// 			// 		std::cout << d_nontrv_nnz_view[ i ] << ", ";
+// 			// 	}
+// 			// 	std::cout << " ])\n";
+// 			// 	std::cout << " v = array([";
+// 			// 	for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
+// 			// 		std::cout << v_nontrv_nnz_view[ i ] << ", ";
+// 			// 	}
+// 			// 	std::cout << " ])\n";
+
+// 			// 	Scalar< D > a( d_nontrv_nnz_view[ i ] );
+// 			// 	Scalar< D > b( d_nontrv_nnz_view[ i ] );
+// 			// 	std::cout << "0 a,b=" << *a << " " << *b << "\n";
+// 			// 	if( i + 1 < non_trivial_egvc_count  ) {
+// 			// 		std::cout << " alp::set b to <<" << d_nontrv_nnz_view[ i + 1 ] << ">> \n";
+// 			// 		rc = alp::set( b, Scalar< D >( d_nontrv_nnz_view[ i + 1 ] ) );
+// 			// 		if( rc != SUCCESS ) {
+// 			// 			std::cout << " **** alp::set failed ***** \n";
+// 			// 		}
+// 			// 		std::cout << "1  a,b=" << *a << " " << *b << "\n";
+// 			// 	} else {
+// 			// 		Scalar< D > alpha( zero );
+// 			// 		rc = rc ? rc : norm2( alpha, v, ring );
+// 			// 		foldl( b, alpha, ring.getAdditiveOperator() );
+// 			// 		std::cout << "2 a,b=" << *a << " " << *b << "\n";
+// 			// 	}
+// 			// 	Scalar< D > lambda( ( *a - *b ) / 2 );
+
+// 			// 	std::cout << " a,lambda,b=" << *a << " " << *lambda << " " << *b << "\n";
+
+// 			// 	rc = rc ? rc : bisec_sec_eq( lambda, d_nontrv_nnz_view, v_nontrv_nnz_view, a, b );
+// 			// 	std::cout << " lambda (" << i << ") = " << *lambda << "\n";
+// 			}
+// #endif
+
+
+// #ifdef TEMPDISABLE
+// 			for( size_t i = 0; i < non_trivial_egvc_count; i++ ) {
+// 				egvals_nontrv[ i ] = d_nontrv[ i ];
+// 				Vector< D, structures::General, Dense > dvec( non_trivial_egvc_count );
+// 				alp::set( dvec, zero );
+// 				dvec[ i ] = *one;
+// 				auto Egvecs_nontrv_vec_view = get_view( Egvecs_nontrv, utils::range( 0, non_trivial_egvc_count ), i );
+// 				rc = rc ? rc : alp::set( Egvecs_nontrv_vec_view, dvec );
+// 			}
+// #else
+// 			not implemented;
+// #endif
+
+// 			//copy egvals_nontrv and Egvecs_nontrv into egvals and Egvecs
+// 			size_t k = 0;
+// 			for( size_t i = 0; i < n; i++ ) {
+// 				if( !( std::abs( v[ i ] ) < eps ) ) {
+// 					egvals[ i ] = egvals_nontrv[ k ];
+// 					//resolve this with select/permute view
+// #ifdef TEMPDISABLE
+// 					auto Egvecs_nontrv_vec_view = get_view( Egvecs_nontrv, utils::range( 0, non_trivial_egvc_count ), k );
+// 					auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, non_trivial_egvc_count ), i ); // this is wrong
+// 					rc = rc ? rc : alp::set( Egvecs_vec_view, Egvecs_nontrv_vec_view );
+// #endif
+// 				}
+// 			}
 
 			return rc;
 		}
@@ -411,8 +451,9 @@ namespace alp {
 			auto Utop = get_view< OrthogonalType >( U, utils::range( 0, m ), utils::range( 0, m ) );
 			auto Udown = get_view< OrthogonalType >( U, utils::range( m, n ), utils::range( m, n ) );
 
-			rc = rc ? rc : symm_tridiag_dac_eigensolver( Ttop, Utop, dtop, ring );
-			rc = rc ? rc : symm_tridiag_dac_eigensolver( Tdown, Udown, ddown, ring );
+			// rc = rc ? rc : symm_tridiag_dac_eigensolver( Ttop, Utop, dtop, ring );
+			// rc = rc ? rc : symm_tridiag_dac_eigensolver( Tdown, Udown, ddown, ring );
+			std::cout << " --> ust one iteration\n";
 
 #ifdef DEBUG
 			std::cout << " after symm_tridiag_dac_eigensolver call:\n";
@@ -466,28 +507,27 @@ namespace alp {
 					return ( dtmp[ a ] < dtmp[ b ] );
 				}
 			);
+			alp::Vector< size_t > permutation_vec( n );
+			alp::buildVector( permutation_vec, isort_dtmp.begin(), isort_dtmp.end() );
+
 #ifdef DEBUG
 			print_vector( "  dtmp  ", dtmp );
-			std::cout << " sort(dtmp) = \n";
-			std::cout << "    [ ";
-			for( size_t i = 0 ; i < n ; ++i ) {
-				std::cout << "\t" << dtmp[ isort_dtmp[ i ] ];
-			}
-			std::cout << " ]\n";
+			// std::cout << " sort(dtmp) = \n";
+			// std::cout << "    [ ";
+			// for( size_t i = 0 ; i < n ; ++i ) {
+			// 	std::cout << "\t" << dtmp[ isort_dtmp[ i ] ];
+			// }
+			// std::cout << " ]\n";
 #endif
 
-			// temp solution:
-			// dtmp2 and ztmp2 in the final version should be
-			// permutations views of dtmp and z, respectively
-			// instead, here we materialize permutations
-			Vector< D, structures::General, Dense > dtmp2( n );
-			Vector< D, structures::General, Dense > ztmp2( n );
-			rc = rc ? rc : alp::set( dtmp2, zero );
-			rc = rc ? rc : alp::set( ztmp2, zero );
-			for( size_t i = 0 ; i < n ; ++i ) {
-				dtmp2[ i ] = dtmp[ isort_dtmp[ i ] ];
-				ztmp2[ i ] = z[ isort_dtmp[ i ] ];
-			}
+			auto dtmp2 = alp::get_view< alp::structures::General >(
+				dtmp,
+				permutation_vec
+			);
+			auto ztmp2 = alp::get_view< alp::structures::General >(
+				z,
+				permutation_vec
+			);
 #ifdef DEBUG
 			print_vector( "  dtmp2  ", dtmp2 );
 			print_vector( "  ztmp2  ", ztmp2 );
@@ -497,32 +537,25 @@ namespace alp {
 			rc = rc ? rc : alp::set( d, zero );
 			Matrix< D, OrthogonalType, Dense > QdOuter( n );
 			rc = rc ? rc : alp::set( QdOuter, zero );
-			rc = rc ? rc : eigensolveDiagPlusOuter( d, QdOuter, dtmp2, ztmp2 );
+			auto QdOuter2 = alp::get_view< alp::structures::Orthogonal >(
+				QdOuter, permutation_vec, permutation_vec
+			);
 
 #ifdef DEBUG
-			print_matrix( "  QdOuter  ", QdOuter );
+			print_matrix( "  QdOuter(in)  ", QdOuter );
 #endif
-
-			// temp
-			// unpermute cols into QdOuterUnpermuted
-			Matrix< D, OrthogonalType, Dense > QdOuterUnpermuted( n );
-			rc = rc ? rc : alp::set( QdOuterUnpermuted, zero );
-			for( size_t i = 0 ; i < n ; ++i ) {
-				auto vin = get_view( QdOuter, utils::range( 0, n ), i );
-				auto vout = get_view( QdOuterUnpermuted, utils::range( 0, n ), isort_dtmp[ i ] );
-				rc = rc ? rc : alp::set( vout, vin );
-			}
-
+			rc = rc ? rc : eigensolveDiagPlusOuter( d, QdOuter2, dtmp2, ztmp2 );
 #ifdef DEBUG
-			print_matrix( "  QdOuterUnpermuted  ", QdOuterUnpermuted );
+			print_matrix( "  QdOuter(out)  ", QdOuter );
 #endif
 
+
 			// Q=U.dot((V[:,iiinv]).T)
 			rc = rc ? rc : alp::set( Q, zero );
 			rc = rc ? rc : mxm(
 				Q,
 				U,
-				alp::get_view< alp::view::transpose >( QdOuterUnpermuted ),
+				alp::get_view< alp::view::transpose >( QdOuter ),
 				ring
 			);
 

From 633e1401d8884079dcb08640f366b80887f3d902 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Wed, 19 Oct 2022 11:39:51 +0200
Subject: [PATCH 06/14] functional version

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 169 ++++++++++++------
 1 file changed, 118 insertions(+), 51 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index f33690422..2c935804a 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -60,10 +60,10 @@ namespace alp {
 		) {
 			RC rc = SUCCESS;
 
-#ifdef DEBUG
-			std::cout << " a = " << *a << " ";
-			std::cout << " b = " << *b << " ";
-#endif
+// #ifdef DEBUG
+// 			std::cout << " a = " << *a << " ";
+// 			std::cout << " b = " << *b << " ";
+// #endif
 
 			const Scalar< D > zero( ring.template getZero< D >() );
 			const Scalar< D > one( ring.template getOne< D >() );
@@ -88,10 +88,10 @@ namespace alp {
 				v
 			);
 
-#ifdef DEBUG
-			std::cout << " x0 = " << *x0 << " ";
-			std::cout << " fx0 = " << *fx0 << "\n";
-#endif
+// #ifdef DEBUG
+// 			std::cout << " x0 = " << *x0 << " ";
+// 			std::cout << " fx0 = " << *fx0 << "\n";
+// #endif
 
 			if( std::abs( *fx0 ) < tol ) {
 				alp::set( lambda, x0 );
@@ -191,52 +191,33 @@ namespace alp {
 			auto egvals_direct = get_view< alp::structures::General >( egvals, select_direct );
 			auto egvals_non_direct = get_view< alp::structures::General >( egvals, select_non_direct );
 
-			auto Egvecs_direct = alp::get_view< alp::structures::Orthogonal >(
-				Egvecs, select_direct, select_direct
-			);
+			// not needed as Q is alrady set to identity
+			// auto Egvecs_direct = alp::get_view< alp::structures::Orthogonal >(
+			// 	Egvecs, select_direct, select_direct
+			// );
 			auto Egvecs_non_direct = alp::get_view< alp::structures::Orthogonal >(
 				Egvecs, select_non_direct, select_non_direct
 			);
 
+			// copy d -> egvals for direct part
+			rc = rc ? rc : alp::set(
+				egvals_direct,
+				get_view< alp::structures::General >( d, select_direct )
+			);
 
-			// Vector< D, structures::General, Dense > d_nontrv( n );
-			// Vector< D, structures::General, Dense > v_nontrv( n );
-			// alp::set( d_nontrv, zero );
-			// alp::set( v_nontrv, zero );
-
-			// for( size_t i = 0; i < n; i++ ) {
-			// 	if( std::abs( v[ i ] ) < eps ) {
-			// 		//simple egval formula ;
-			// 		//set eigenvalue
-			// 		egvals[ i ] = d[ i ];
-			// 		//set eigenvector
-			// 		//(could be done without temp vector by using eWiseLambda)
-			// 		Vector< D, structures::General, Dense > dvec( n );
-			// 		alp::set( dvec, zero );
-			// 		dvec[ i ] = *one;
-			// 		auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, n ), i );
-			// 		rc = rc ? rc : alp::set( Egvecs_vec_view, dvec );
-			// 	} else {
-			// 		//complicated egval formula ;
-			// 		d_nontrv[ non_trivial_egvc_count ] = d[ i ];
-			// 		v_nontrv[ non_trivial_egvc_count ] = v[ i ];
-			// 		++non_trivial_egvc_count;
-			// 	}
-			// }
+			//rc = rc ? rc : alp::set( Egvecs_non_direct, one );
+			//rc = rc ? rc : alp::set( egvals_non_direct, one );
 
-			// auto d_nontrv_nnz_view = get_view( d_nontrv, utils::range( 0, non_trivial_egvc_count ) );
-			// auto v_nontrv_nnz_view = get_view( v_nontrv, utils::range( 0, non_trivial_egvc_count ) );
+			auto d_view = get_view< alp::structures::General >( d, select_non_direct );
+			auto v_view = get_view< alp::structures::General >( v, select_non_direct );
+
+#ifdef DEBUG
+			print_vector( "eigensolveDiagPlusOuter: d ", d );
+			print_vector( "eigensolveDiagPlusOuter: v ", v );
+			print_vector( "eigensolveDiagPlusOuter: d_view ", d_view );
+			print_vector( "eigensolveDiagPlusOuter: v_view ", v_view );
 
-			// Vector< D, structures::General, Dense > egvals_nontrv( non_trivial_egvc_count );
-			// Matrix< D, OrthogonalType, Dense > Egvecs_nontrv( non_trivial_egvc_count );
-			// rc = rc ? rc : alp::set( egvals_nontrv, zero );
-			// rc = rc ? rc : alp::set( Egvecs_nontrv, zero );
 
-// #ifdef DEBUG
-// 			print_vector( "eigensolveDiagPlusOuter: d ", d );
-// 			print_vector( "eigensolveDiagPlusOuter: v ", v );
-// 			print_vector( "eigensolveDiagPlusOuter: d_nontrv_nnz_view ", d_nontrv_nnz_view );
-// 			print_vector( "eigensolveDiagPlusOuter: v_nontrv_nnz_view ", v_nontrv_nnz_view );
 
 // 			// for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
 // 			// 	std::cout << " ============ i= " << i << "  ============\n";
@@ -275,7 +256,76 @@ namespace alp {
 // 			// 	rc = rc ? rc : bisec_sec_eq( lambda, d_nontrv_nnz_view, v_nontrv_nnz_view, a, b );
 // 			// 	std::cout << " lambda (" << i << ") = " << *lambda << "\n";
 // 			}
-// #endif
+#endif
+
+			/////////////////// OK code //////////////////////////////
+
+			// vec_b = {d_view[1], d_view[2], ... , d_view[N-1], d_view[N]+dot(v,v) }
+			size_t nn = alp::getLength( d_view );
+			alp::Vector< D > vec_b( nn );
+			auto v1 = get_view( vec_b, utils::range( 0, nn - 1 ) );
+			auto v2 = get_view( d_view, utils::range( 1, nn ) );
+			rc = rc ? rc : alp::set( v1, v2 );
+			auto v3 = get_view( vec_b, utils::range( nn - 1, nn ) );
+			auto v4 = get_view( d_view, utils::range( nn - 1, nn ) );
+			rc = rc ? rc : alp::set( v3, v4 );
+			Scalar< D > alpha( zero );
+			rc = rc ? rc : dot( alpha, d_view, d_view, ring );
+			auto v5 = get_view( vec_b, utils::range( alp::getLength( vec_b ) - 1, alp::getLength( vec_b ) ) );
+			rc = rc ? rc : alp::foldl( v5, alpha, ring.getAdditiveOperator() );
+
+			alp::Vector< D > vec_temp_egvals( nn );
+			alp::Vector< D > vec_temp_d( nn );
+			alp::Vector< D > vec_temp_v( nn );
+
+			rc = rc ? rc : alp::set( vec_temp_egvals, zero );
+			rc = rc ? rc : alp::set( vec_temp_d, d_view );
+			rc = rc ? rc : alp::set( vec_temp_v, v_view );
+
+			rc = rc ? rc : eWiseLambda(
+				[ &d_view, &vec_temp_v, &vec_b ]( const size_t i, D &val ) {
+					Scalar< D > a( d_view[ i ] );
+					Scalar< D > b( vec_b[ i ] );
+					Scalar< D > w( ( *a + *b ) / 2 );
+					bisec_sec_eq( w, d_view, vec_temp_v, a, b );
+					val = *w;
+				},
+				vec_temp_egvals
+			);
+			rc = rc ? rc : alp::set( egvals_non_direct, vec_temp_egvals );
+
+			// until fold vec -> matrix (or scatter) is implemented
+			// we have to use this for loop
+			for( size_t i = 0; i < nn; i++ ) {
+				auto egvecs_view = get_view( Egvecs_non_direct, utils::range( 0, nn ), i );
+				alp::set( egvecs_view, vec_temp_v );
+#ifdef DEBUG
+			print_vector( "-----> egvecs_view(0) ", egvecs_view );
+#endif
+				alp::set( vec_temp_egvals, vec_temp_d );
+#ifdef DEBUG
+			print_vector( "-----> egvecs_view(1) ", vec_temp_egvals );
+#endif
+				Scalar< D > lambda_i( egvals_non_direct[ i ] );
+				rc = rc ? rc : alp::foldl( vec_temp_egvals, lambda_i, minus );
+#ifdef DEBUG
+			print_vector( "-----> egvecs_view(2) ", vec_temp_egvals );
+#endif
+				rc = rc ? rc : alp::foldl( egvecs_view, vec_temp_egvals , divide );
+#ifdef DEBUG
+			print_vector( "-----> egvecs_view(3) ", vec_temp_egvals );
+#endif
+				Scalar< D > norm1( zero );
+				rc = rc ? rc : norm2( norm1, egvecs_view, ring );
+				rc = rc ? rc : alp::foldl( egvecs_view, norm1 , divide );
+			}
+
+
+#ifdef DEBUG
+			print_vector( "-----> d_view ", d_view );
+			print_vector( "-----> vec_b  ", vec_b );
+#endif
+			//////////////////////////////////////////////////////////
 
 
 // #ifdef TEMPDISABLE
@@ -451,9 +501,9 @@ namespace alp {
 			auto Utop = get_view< OrthogonalType >( U, utils::range( 0, m ), utils::range( 0, m ) );
 			auto Udown = get_view< OrthogonalType >( U, utils::range( m, n ), utils::range( m, n ) );
 
-			// rc = rc ? rc : symm_tridiag_dac_eigensolver( Ttop, Utop, dtop, ring );
-			// rc = rc ? rc : symm_tridiag_dac_eigensolver( Tdown, Udown, ddown, ring );
-			std::cout << " --> ust one iteration\n";
+			rc = rc ? rc : symm_tridiag_dac_eigensolver( Ttop, Utop, dtop, ring );
+			rc = rc ? rc : symm_tridiag_dac_eigensolver( Tdown, Udown, ddown, ring );
+			//std::cout << " --> ust one iteration\n";
 
 #ifdef DEBUG
 			std::cout << " after symm_tridiag_dac_eigensolver call:\n";
@@ -492,9 +542,17 @@ namespace alp {
 #endif
 
 #ifdef DEBUG
+// 			//testis
+// 			std::vector< double > xdtmp{ 1, 4, 2, 10, -1, 3};
+// 			std::vector< double > xztmp{ 1, 2, 1, 1.e-12, -1, 1.e-12};
+// 			alp::buildVector( dtmp, xdtmp.begin(), xdtmp.end() );
+// 			alp::buildVector( z, xztmp.begin(), xztmp.end() );
+// //test
+
 			print_vector( "  z  ", z );
 #endif
 
+
 			// permutations which sort dtmp
 			std::vector< size_t > isort_dtmp( n, 0 );
 			for( size_t i = 0 ; i < n ; ++i ) {
@@ -537,16 +595,25 @@ namespace alp {
 			rc = rc ? rc : alp::set( d, zero );
 			Matrix< D, OrthogonalType, Dense > QdOuter( n );
 			rc = rc ? rc : alp::set( QdOuter, zero );
+			{
+				auto QdOuter_diag = alp::get_view< alp::view::diagonal >( QdOuter );
+				rc = rc ? rc : alp::set(
+					QdOuter_diag,
+					one
+				);
+			}
+
 			auto QdOuter2 = alp::get_view< alp::structures::Orthogonal >(
 				QdOuter, permutation_vec, permutation_vec
 			);
-
 #ifdef DEBUG
 			print_matrix( "  QdOuter(in)  ", QdOuter );
+			print_vector( "  d(in)  ", d );
 #endif
 			rc = rc ? rc : eigensolveDiagPlusOuter( d, QdOuter2, dtmp2, ztmp2 );
 #ifdef DEBUG
 			print_matrix( "  QdOuter(out)  ", QdOuter );
+			print_vector( "  d(out)  ", d );
 #endif
 
 

From b0f5150517a7a898da4c09a3733592e8b9920302 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Thu, 20 Oct 2022 12:35:01 +0200
Subject: [PATCH 07/14] working but unstable version numerical correctness
 skipped

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 216 +++--------
 include/alp/structures.hpp                    |   7 +-
 tests/smoke/alp_stedc.cpp                     | 346 ++++++++----------
 3 files changed, 222 insertions(+), 347 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index 2c935804a..f6d7d3888 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -1,5 +1,5 @@
 /*
- *   Copyright 2021 Huawei Technologies Co., Ltd.
+ *   Copyright 2022 Huawei Technologies Co., Ltd.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -19,7 +19,9 @@
 
 #include <alp.hpp>
 #include <graphblas/utils/iscomplex.hpp> // use from grb
+#ifdef DEBUG
 #include "../tests/utils/print_alp_containers.hpp"
+#endif
 
 // TEMPDISABLE should be removed in the final version
 #define TEMPDISABLE
@@ -53,18 +55,13 @@ namespace alp {
 			Vector<	D, structures::General,	Dense, VecView2, VecImfR2, VecImfC2 > &v,
 			const Scalar< D > &a,
 			const Scalar< D > &b,
-			const D tol=1.e-12,
-			const Ring & ring = Ring(),
-			const Minus & minus = Minus(),
-			const Divide & divide = Divide()
+			const D tol = 1.e-10,
+			const Ring &ring = Ring(),
+			const Minus &minus = Minus(),
+			const Divide &divide = Divide()
 		) {
 			RC rc = SUCCESS;
 
-// #ifdef DEBUG
-// 			std::cout << " a = " << *a << " ";
-// 			std::cout << " b = " << *b << " ";
-// #endif
-
 			const Scalar< D > zero( ring.template getZero< D >() );
 			const Scalar< D > one( ring.template getOne< D >() );
 			Scalar< D > x0( ( *a + *b ) / ( 2 ) );
@@ -88,11 +85,6 @@ namespace alp {
 				v
 			);
 
-// #ifdef DEBUG
-// 			std::cout << " x0 = " << *x0 << " ";
-// 			std::cout << " fx0 = " << *fx0 << "\n";
-// #endif
-
 			if( std::abs( *fx0 ) < tol ) {
 				alp::set( lambda, x0 );
 				return rc;
@@ -147,10 +139,11 @@ namespace alp {
 			Matrix< D, OrthogonalType, Dense, OrthViewType, OrthViewImfR, OrthViewImfC > &Egvecs,
 			Vector<	D, structures::General, Dense, VecView2, VecImfR2, VecImfC2 > &d,
 			Vector< D, structures::General, Dense, VecView3, VecImfR3, VecImfC3 > &v,
-			const Ring & ring = Ring(),
-			const Minus & minus = Minus(),
-			const Divide & divide = Divide()
+			const Ring &ring = Ring(),
+			const Minus &minus = Minus(),
+			const Divide &divide = Divide()
 		) {
+			(void)minus;
 			RC rc = SUCCESS;
 
 			const Scalar< D > zero( ring.template getZero< D >() );
@@ -168,11 +161,14 @@ namespace alp {
 
 			for( size_t i = 0; i < n; i++ ) {
 				if( std::abs( v[ i ] ) < eps ) {
-					//simple egval formula ;
+					// in these cases equals are canonical vectors
+					// and eigenvalues are d[i]
 					direct_egvc_indx[ count_direct_egvc ] = i ;
 					++count_direct_egvc;
 				} else {
-					//complicated egval formula ;
+					// these cases require complicated egval formula
+					// and for cases where egval is close to the singular point
+					// different algorithm for eigenvectors needs to be implemented
 					non_direct_egvc_indx[ count_non_direct_egvc ] = i;
 					++count_non_direct_egvc;
 				}
@@ -185,8 +181,8 @@ namespace alp {
 			alp::buildVector( select_non_direct, non_direct_egvc_indx.begin(), non_direct_egvc_indx.end() );
 
 #ifdef DEBUG
-			std::cout << " count_direct_egvc = " << count_direct_egvc << "\n";
-			std::cout << " count_non_direct_egvc = " << count_non_direct_egvc << "\n";
+			std::cout << " ---->     count_direct_egvc = " << count_direct_egvc << "\n";
+			std::cout << " ----> count_non_direct_egvc = " << count_non_direct_egvc << "\n";
 #endif
 			auto egvals_direct = get_view< alp::structures::General >( egvals, select_direct );
 			auto egvals_non_direct = get_view< alp::structures::General >( egvals, select_non_direct );
@@ -205,9 +201,6 @@ namespace alp {
 				get_view< alp::structures::General >( d, select_direct )
 			);
 
-			//rc = rc ? rc : alp::set( Egvecs_non_direct, one );
-			//rc = rc ? rc : alp::set( egvals_non_direct, one );
-
 			auto d_view = get_view< alp::structures::General >( d, select_non_direct );
 			auto v_view = get_view< alp::structures::General >( v, select_non_direct );
 
@@ -216,50 +209,8 @@ namespace alp {
 			print_vector( "eigensolveDiagPlusOuter: v ", v );
 			print_vector( "eigensolveDiagPlusOuter: d_view ", d_view );
 			print_vector( "eigensolveDiagPlusOuter: v_view ", v_view );
-
-
-
-// 			// for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
-// 			// 	std::cout << " ============ i= " << i << "  ============\n";
-
-// 			// 	std::cout << " d = array([";
-// 			// 	for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
-// 			// 		std::cout << d_nontrv_nnz_view[ i ] << ", ";
-// 			// 	}
-// 			// 	std::cout << " ])\n";
-// 			// 	std::cout << " v = array([";
-// 			// 	for( size_t i = 0; i < non_trivial_egvc_count; ++i ) {
-// 			// 		std::cout << v_nontrv_nnz_view[ i ] << ", ";
-// 			// 	}
-// 			// 	std::cout << " ])\n";
-
-// 			// 	Scalar< D > a( d_nontrv_nnz_view[ i ] );
-// 			// 	Scalar< D > b( d_nontrv_nnz_view[ i ] );
-// 			// 	std::cout << "0 a,b=" << *a << " " << *b << "\n";
-// 			// 	if( i + 1 < non_trivial_egvc_count  ) {
-// 			// 		std::cout << " alp::set b to <<" << d_nontrv_nnz_view[ i + 1 ] << ">> \n";
-// 			// 		rc = alp::set( b, Scalar< D >( d_nontrv_nnz_view[ i + 1 ] ) );
-// 			// 		if( rc != SUCCESS ) {
-// 			// 			std::cout << " **** alp::set failed ***** \n";
-// 			// 		}
-// 			// 		std::cout << "1  a,b=" << *a << " " << *b << "\n";
-// 			// 	} else {
-// 			// 		Scalar< D > alpha( zero );
-// 			// 		rc = rc ? rc : norm2( alpha, v, ring );
-// 			// 		foldl( b, alpha, ring.getAdditiveOperator() );
-// 			// 		std::cout << "2 a,b=" << *a << " " << *b << "\n";
-// 			// 	}
-// 			// 	Scalar< D > lambda( ( *a - *b ) / 2 );
-
-// 			// 	std::cout << " a,lambda,b=" << *a << " " << *lambda << " " << *b << "\n";
-
-// 			// 	rc = rc ? rc : bisec_sec_eq( lambda, d_nontrv_nnz_view, v_nontrv_nnz_view, a, b );
-// 			// 	std::cout << " lambda (" << i << ") = " << *lambda << "\n";
-// 			}
 #endif
 
-			/////////////////// OK code //////////////////////////////
-
 			// vec_b = {d_view[1], d_view[2], ... , d_view[N-1], d_view[N]+dot(v,v) }
 			size_t nn = alp::getLength( d_view );
 			alp::Vector< D > vec_b( nn );
@@ -269,11 +220,10 @@ namespace alp {
 			auto v3 = get_view( vec_b, utils::range( nn - 1, nn ) );
 			auto v4 = get_view( d_view, utils::range( nn - 1, nn ) );
 			rc = rc ? rc : alp::set( v3, v4 );
-			Scalar< D > alpha( zero );
-			rc = rc ? rc : dot( alpha, d_view, d_view, ring );
-			auto v5 = get_view( vec_b, utils::range( alp::getLength( vec_b ) - 1, alp::getLength( vec_b ) ) );
-			rc = rc ? rc : alp::foldl( v5, alpha, ring.getAdditiveOperator() );
 
+			// eWiseLambda currently does not work with select view
+			// dot does not work with select view
+			// as a temp solutions we make temp vectors 
 			alp::Vector< D > vec_temp_egvals( nn );
 			alp::Vector< D > vec_temp_d( nn );
 			alp::Vector< D > vec_temp_v( nn );
@@ -282,6 +232,14 @@ namespace alp {
 			rc = rc ? rc : alp::set( vec_temp_d, d_view );
 			rc = rc ? rc : alp::set( vec_temp_v, v_view );
 
+			Scalar< D > alpha( zero );
+			//rc = rc ? rc : dot( alpha, d_view, d_view, ring ); // bug!
+			rc = rc ? rc : dot( alpha, vec_temp_v, vec_temp_v, ring );
+
+			auto v5 = get_view( vec_b, utils::range( alp::getLength( vec_b ) - 1, alp::getLength( vec_b ) ) );
+			rc = rc ? rc : alp::foldl( v5, alpha, ring.getAdditiveOperator() );
+
+
 			rc = rc ? rc : eWiseLambda(
 				[ &d_view, &vec_temp_v, &vec_b ]( const size_t i, D &val ) {
 					Scalar< D > a( d_view[ i ] );
@@ -298,63 +256,20 @@ namespace alp {
 			// we have to use this for loop
 			for( size_t i = 0; i < nn; i++ ) {
 				auto egvecs_view = get_view( Egvecs_non_direct, utils::range( 0, nn ), i );
+				// //test
+				// alp::set( egvecs_view, Scalar< D >( i + 1 ) );
+				// //test
+
 				alp::set( egvecs_view, vec_temp_v );
-#ifdef DEBUG
-			print_vector( "-----> egvecs_view(0) ", egvecs_view );
-#endif
 				alp::set( vec_temp_egvals, vec_temp_d );
-#ifdef DEBUG
-			print_vector( "-----> egvecs_view(1) ", vec_temp_egvals );
-#endif
 				Scalar< D > lambda_i( egvals_non_direct[ i ] );
-				rc = rc ? rc : alp::foldl( vec_temp_egvals, lambda_i, minus );
-#ifdef DEBUG
-			print_vector( "-----> egvecs_view(2) ", vec_temp_egvals );
-#endif
+				rc = rc ? rc : alp::foldl( vec_temp_egvals, lambda_i , minus );
 				rc = rc ? rc : alp::foldl( egvecs_view, vec_temp_egvals , divide );
-#ifdef DEBUG
-			print_vector( "-----> egvecs_view(3) ", vec_temp_egvals );
-#endif
 				Scalar< D > norm1( zero );
 				rc = rc ? rc : norm2( norm1, egvecs_view, ring );
 				rc = rc ? rc : alp::foldl( egvecs_view, norm1 , divide );
 			}
 
-
-#ifdef DEBUG
-			print_vector( "-----> d_view ", d_view );
-			print_vector( "-----> vec_b  ", vec_b );
-#endif
-			//////////////////////////////////////////////////////////
-
-
-// #ifdef TEMPDISABLE
-// 			for( size_t i = 0; i < non_trivial_egvc_count; i++ ) {
-// 				egvals_nontrv[ i ] = d_nontrv[ i ];
-// 				Vector< D, structures::General, Dense > dvec( non_trivial_egvc_count );
-// 				alp::set( dvec, zero );
-// 				dvec[ i ] = *one;
-// 				auto Egvecs_nontrv_vec_view = get_view( Egvecs_nontrv, utils::range( 0, non_trivial_egvc_count ), i );
-// 				rc = rc ? rc : alp::set( Egvecs_nontrv_vec_view, dvec );
-// 			}
-// #else
-// 			not implemented;
-// #endif
-
-// 			//copy egvals_nontrv and Egvecs_nontrv into egvals and Egvecs
-// 			size_t k = 0;
-// 			for( size_t i = 0; i < n; i++ ) {
-// 				if( !( std::abs( v[ i ] ) < eps ) ) {
-// 					egvals[ i ] = egvals_nontrv[ k ];
-// 					//resolve this with select/permute view
-// #ifdef TEMPDISABLE
-// 					auto Egvecs_nontrv_vec_view = get_view( Egvecs_nontrv, utils::range( 0, non_trivial_egvc_count ), k );
-// 					auto Egvecs_vec_view = get_view( Egvecs, utils::range( 0, non_trivial_egvc_count ), i ); // this is wrong
-// 					rc = rc ? rc : alp::set( Egvecs_vec_view, Egvecs_nontrv_vec_view );
-// #endif
-// 				}
-// 			}
-
 			return rc;
 		}
 
@@ -445,7 +360,7 @@ namespace alp {
 					},
 					T
 				);
-				// Q=array([[1]]);
+				// Q=[[1]]; a 1x1 matrix
 				rc = rc ? rc : alp::set( Q, one );
 
 				return rc;
@@ -473,13 +388,12 @@ namespace alp {
 			auto vvt =  alp::outer( v, ring.getMultiplicativeOperator() ) ;
 
 #ifdef DEBUG
-			print_matrix( " Atmp(0) = ", Atmp );
 			print_matrix( " vvt = ", vvt );
 #endif
 			rc = rc ? rc : alp::foldl( Atmp, vvt, minus );
 
 #ifdef DEBUG
-			print_matrix( " Atmp(1) = ", Atmp );
+			print_matrix( " Atmp(updated)  ", Atmp );
 #endif
 
 			auto Ttop = get_view< SymmOrHermTridiagonalType >( Atmp, utils::range( 0, m ), utils::range( 0, m ) );
@@ -542,21 +456,16 @@ namespace alp {
 #endif
 
 #ifdef DEBUG
-// 			//testis
-// 			std::vector< double > xdtmp{ 1, 4, 2, 10, -1, 3};
-// 			std::vector< double > xztmp{ 1, 2, 1, 1.e-12, -1, 1.e-12};
-// 			alp::buildVector( dtmp, xdtmp.begin(), xdtmp.end() );
-// 			alp::buildVector( z, xztmp.begin(), xztmp.end() );
-// //test
-
+			print_vector( "  d  ", dtmp );
 			print_vector( "  z  ", z );
 #endif
 
-
 			// permutations which sort dtmp
 			std::vector< size_t > isort_dtmp( n, 0 );
+			std::vector< size_t > no_permute_data( n, 0 );
 			for( size_t i = 0 ; i < n ; ++i ) {
 				isort_dtmp[ i ] = i;
+				no_permute_data[ i ] = i;
 			}
 			std::sort(
 				isort_dtmp.begin(),
@@ -566,17 +475,9 @@ namespace alp {
 				}
 			);
 			alp::Vector< size_t > permutation_vec( n );
+			alp::Vector< size_t > no_permutation_vec( n );
 			alp::buildVector( permutation_vec, isort_dtmp.begin(), isort_dtmp.end() );
-
-#ifdef DEBUG
-			print_vector( "  dtmp  ", dtmp );
-			// std::cout << " sort(dtmp) = \n";
-			// std::cout << "    [ ";
-			// for( size_t i = 0 ; i < n ; ++i ) {
-			// 	std::cout << "\t" << dtmp[ isort_dtmp[ i ] ];
-			// }
-			// std::cout << " ]\n";
-#endif
+			alp::buildVector( no_permutation_vec, no_permute_data.begin(), no_permute_data.end() );
 
 			auto dtmp2 = alp::get_view< alp::structures::General >(
 				dtmp,
@@ -595,36 +496,29 @@ namespace alp {
 			rc = rc ? rc : alp::set( d, zero );
 			Matrix< D, OrthogonalType, Dense > QdOuter( n );
 			rc = rc ? rc : alp::set( QdOuter, zero );
-			{
-				auto QdOuter_diag = alp::get_view< alp::view::diagonal >( QdOuter );
-				rc = rc ? rc : alp::set(
-					QdOuter_diag,
-					one
-				);
-			}
+			auto QdOuter_diag = alp::get_view< alp::view::diagonal >( QdOuter );
+			rc = rc ? rc : alp::set(
+				QdOuter_diag,
+				one
+			);
 
 			auto QdOuter2 = alp::get_view< alp::structures::Orthogonal >(
-				QdOuter, permutation_vec, permutation_vec
+				QdOuter, permutation_vec, no_permutation_vec
 			);
-#ifdef DEBUG
-			print_matrix( "  QdOuter(in)  ", QdOuter );
-			print_vector( "  d(in)  ", d );
-#endif
+
 			rc = rc ? rc : eigensolveDiagPlusOuter( d, QdOuter2, dtmp2, ztmp2 );
 #ifdef DEBUG
-			print_matrix( "  QdOuter(out)  ", QdOuter );
 			print_vector( "  d(out)  ", d );
+			print_matrix( "  QdOuter(out)  ", QdOuter );
+			print_matrix( "  U  ", U );
 #endif
 
-
-			// Q=U.dot((V[:,iiinv]).T)
 			rc = rc ? rc : alp::set( Q, zero );
-			rc = rc ? rc : mxm(
-				Q,
-				U,
-				alp::get_view< alp::view::transpose >( QdOuter ),
-				ring
-			);
+			rc = rc ? rc : mxm( Q, U, QdOuter, ring	);
+
+#ifdef DEBUG
+			print_matrix( "  Q = U x Q   ", Q );
+#endif
 
 			return rc;
 		}
diff --git a/include/alp/structures.hpp b/include/alp/structures.hpp
index 950f6204b..93a51662a 100644
--- a/include/alp/structures.hpp
+++ b/include/alp/structures.hpp
@@ -633,7 +633,12 @@ namespace alp {
 		struct isInstantiable< Orthogonal, Orthogonal > {
 			template< typename ImfR, typename ImfC >
 			static bool check( const ImfR &imf_r, const ImfC &imf_c ) {
-				return imf_r.isSame(imf_c);
+				// This chek has to further improved.
+				// Orthogonal matrix in the current implemenation
+				// means full-rank square othogonal matrix.
+				// Rectangular matrix orthogonal only by rows (or columns)
+				// does not fit into the current Orthogonal structure.
+				return imf_r.n == imf_c.n ;
 			};
 		};
 
diff --git a/tests/smoke/alp_stedc.cpp b/tests/smoke/alp_stedc.cpp
index e873ed7b7..0f6d9b6a5 100644
--- a/tests/smoke/alp_stedc.cpp
+++ b/tests/smoke/alp_stedc.cpp
@@ -1,5 +1,5 @@
 /*
- *   Copyright 2021 Huawei Technologies Co., Ltd.
+ *   Copyright 2022 Huawei Technologies Co., Ltd.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -18,49 +18,31 @@
 #include <sstream>
 #include <vector>
 
-// currently only real version
-// #ifdef _COMPLEX
-// #include <complex>
-// #include <cmath>
-// #include <iomanip>
-// #endif
-
-#define DEBUG
-
 #include <alp.hpp>
 #include <alp/algorithms/symm_tridiag_eigensolver.hpp>
 #include <graphblas/utils/iscomplex.hpp> // use from grb
+#ifdef DEBUG
 #include "../utils/print_alp_containers.hpp"
-
-//once TEMPDISABLE is removed the code should be in the final version
-#define TEMPDISABLE
+#endif
 
 using namespace alp;
 
 using BaseScalarType = double;
 using Orthogonal = structures::Orthogonal;
 
-// #ifdef _COMPLEX
-// using ScalarType = std::complex< BaseScalarType >;
-// //not fully implemented structures
-// using HermitianOrSymmetricTridiagonal = structures::HermitianTridiagonal;
-// using HermitianOrSymmetric = structures::Hermitian;
-// #else
 using ScalarType = BaseScalarType;
 
-//temp
+// not fully implemented structures
 using HermitianOrSymmetricTridiagonal = structures::SymmetricTridiagonal;
-//using HermitianOrSymmetricTridiagonal = structures::Square;
 
 //fully implemented structures
 using HermitianOrSymmetric = structures::Symmetric;
-// #endif
 
-constexpr BaseScalarType tol = 1.e-10;
+constexpr BaseScalarType tol = 1.e-5;
 constexpr size_t RNDSEED = 11235;
 
-//temp function untill Hermitian containter is implemented
-//** gnerate symmetric-hermitian matrix in a square container */
+//temp function untill (tridiagonal)Hermitian containter is implemented
+//** gnerate tridiagonal-symmetric-hermitian matrix in a rectangular container */
 template<
 	typename T
 >
@@ -84,7 +66,7 @@ std::vector< T > generate_symmherm_tridiag_matrix_data(
 	return data;
 }
 
-//** generate upper/lower triangular part of a Symmetric matrix */
+//** generate_symmherm_tridiag_matrix_data: real numbers version*/
 template<
 	typename T
 >
@@ -107,151 +89,145 @@ std::vector< T >  generate_symmherm_tridiag_matrix_data(
 	return data;
 }
 
-// //** check if rows/columns or matrix Q are orthogonal */
-// template<
-// 	typename T,
-// 	typename Structure,
-// 	typename ViewType,
-// 	class Ring = Semiring< operators::add< T >, operators::mul< T >, identities::zero, identities::one >
-// >
-// RC check_overlap( alp::Matrix< T, Structure, alp::Density::Dense, ViewType > &Q, const Ring & ring = Ring() ) {
-// 	RC rc = SUCCESS;
-// 	const size_t n = nrows( Q );
-// #ifdef DEBUG
-// 	std::cout << "Overlap matrix for Q:\n";
-// #endif
-// 	for ( size_t i = 0; i < n; ++i ) {
-// 		auto vi = get_view( Q, i, utils::range( 0, n ) );
-// 		for ( size_t j = 0; j < n; ++j ) {
-// 			auto vj = get_view( Q, j, utils::range( 0, n ) );
-// 			Scalar< T > alpha( ring.template getZero< T >() );
-// 			rc = dot( alpha, vi, vj, ring );
-// 			if( rc != SUCCESS ) {
-// 				std::cerr << " dot( alpha, vi, vj, ring ) failed\n";
-// 				return PANIC;
-// 			}
-// 			if( i == j ) {
-// 				if( std::abs( *alpha - ring.template getOne< T >() ) > tol ) {
-// 					std::cerr << " vector " << i << " not normalized\n";
-// 					return PANIC;
-// 				}
-// 			} else {
-// 				if( std::abs( *alpha ) > tol ) {
-// 					std::cerr << " vector " << i << " and vctor " << j << " are note orthogonal\n";
-// 					return PANIC;
-// 				}
-// 			}
-// #ifdef DEBUG
-// 			std::cout << "\t" << std::abs( *alpha );
-// #endif
-// 		}
-// #ifdef DEBUG
-// 		std::cout << "\n";
-// #endif
-// 	}
-// #ifdef DEBUG
-// 	std::cout << "\n";
-// #endif
-// 	return rc;
-// }
-
-
-// //** check solution by calculating H-QTQh */
-// template<
-// 	typename D,
-// 	typename StructureSymm,
-// 	typename StructureOrth,
-// 	typename StructureTrDg,
-// 	class Minus = operators::subtract< D >,
-// 	class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >
-// >
-// RC check_solution(
-// 	alp::Matrix< D, StructureSymm, alp::Density::Dense > &H,
-// 	alp::Matrix< D, StructureOrth, alp::Density::Dense > &Q,
-// 	alp::Matrix< D, StructureTrDg, alp::Density::Dense > &T,
-// 	const Ring &ring = Ring(),
-// 	const Minus &minus = Minus()
-// ) {
-// 	RC rc = SUCCESS;
-// 	const size_t n = nrows( Q );
-
-// #ifdef DEBUG
-// 	std::cout << " ** check_solution **\n";
-// 	std::cout << " input matrices:\n";
-// 	print_matrix( " << H >> ", H );
-// 	print_matrix( " << Q >> ", Q );
-// 	print_matrix( " << T >> ", T );
-// 	std::cout << " ********************\n";
-// #endif
-
-// 	alp::Matrix< D, alp::structures::Square, alp::Density::Dense > QTQh( n );
-// 	alp::Matrix< D, alp::structures::Square, alp::Density::Dense > QTQhmH( n );
-// 	const Scalar< D > zero( ring.template getZero< D >() );
-
-// 	rc = rc ? rc : set( QTQh, zero );
-// 	rc = rc ? rc : mxm( QTQh, T, conjugate( alp::get_view< alp::view::transpose >( Q ) ), ring );
-// 	rc = rc ? rc : set( QTQhmH, zero );
-// 	rc = rc ? rc : mxm( QTQhmH, Q, QTQh, ring );
-// 	rc = rc ? rc : set( QTQh, QTQhmH );
-// #ifdef DEBUG
-// 	print_matrix( " << QTQhmH >> ", QTQhmH );
-// 	print_matrix( " << H >> ", H );
-// 	std::cout << "call foldl( mat, mat, minus )\n";
-// #endif
-
-// #ifndef TEMPDISABLE
-// 	rc = foldl( QTQhmH, H, minus );
-// #else
-// 	rc = rc ? rc : alp::eWiseLambda(
-// 		[ &H, &minus, &zero ]( const size_t i, const size_t j, D &val ) {
-// 			if ( j >= i ) {
-// 				internal::foldl(
-// 					val,
-// 					internal::access( H, internal::getStorageIndex( H, i, j ) ),
-// 					minus
-// 				);
-// 			} else {
-// 				val = *zero;
-// 			}
-// 		},
-// 		QTQhmH
-// 	);
-// #endif
-
-// #ifdef DEBUG
-// 	print_matrix( " << QTQhmH >> ", QTQhmH );
-// 	print_matrix( " << H >> ", H );
-// #endif
-
-// 	//Frobenius norm
-// 	D fnorm = ring.template getZero< D >();
-// 	rc = rc ? rc : alp::eWiseLambda(
-// 		[ &fnorm, &ring ]( const size_t i, const size_t j, D &val ) {
-// 			(void) i;
-// 			(void) j;
-// 			internal::foldl( fnorm, val * val, ring.getAdditiveOperator() );
-// 		},
-// 		QTQhmH
-// 	);
-// 	fnorm = std::sqrt( fnorm );
-
-// #ifdef DEBUG
-// 	std::cout << " FrobeniusNorm(H-QTQh) = " << std::abs( fnorm ) << "\n";
-// #endif
-// 	if( tol < std::abs( fnorm ) ) {
-// #ifdef DEBUG
-// 		std::cout << " ----------------------\n";
-// 		std::cout << " compare matrices\n";
-// 		print_matrix( " << H >> ", H );
-// 		print_matrix( " << QTQh >> ", QTQh );
-// 		std::cout << " ----------------------\n";
-// #endif
-// 		std::cout << "The Frobenius norm is too large.\n";
-// 		return FAILED;
-// 	}
-
-// 	return rc;
-// }
+//** check if rows/columns or matrix Q are orthogonal */
+template<
+	typename T,
+	typename Structure,
+	typename ViewType,
+	class Ring = Semiring< operators::add< T >, operators::mul< T >, identities::zero, identities::one >,
+	class Minus = operators::subtract< T >
+>
+RC check_overlap(
+	alp::Matrix< T, Structure, alp::Density::Dense, ViewType > &Q,
+	const Ring &ring = Ring(),
+	const Minus &minus = Minus()
+) {
+	const Scalar< T > zero( ring.template getZero< T >() );
+	const Scalar< T > one( ring.template getOne< T >() );
+
+	RC rc = SUCCESS;
+	const size_t n = nrows( Q );
+
+	// check if QxQt == I
+	alp::Matrix< T, Structure, alp::Density::Dense, ViewType > Qtmp( n );
+	rc = rc ? rc : set( Qtmp, zero );
+	rc = rc ? rc : mxm(
+		Qtmp,
+		Q,
+		conjugate( alp::get_view< alp::view::transpose >( Q ) ),
+		ring
+	);
+	Matrix< T, Structure, Dense > Identity( n );
+	rc = rc ? rc : alp::set( Identity, zero );
+	auto id_diag = alp::get_view< alp::view::diagonal >( Identity );
+	rc = rc ? rc : alp::set( id_diag, one );
+	rc = rc ? rc : foldl( Qtmp, Identity, minus );
+
+	//Frobenius norm
+	T fnorm = ring.template getZero< T >();
+	rc = rc ? rc : alp::eWiseLambda(
+		[ &fnorm, &ring ]( const size_t i, const size_t j, T &val ) {
+			(void) i;
+			(void) j;
+			internal::foldl( fnorm, val * val, ring.getAdditiveOperator() );
+		},
+		Qtmp
+	);
+	fnorm = std::sqrt( fnorm );
+
+#ifdef DEBUG
+	std::cout << " FrobeniusNorm(QQt - I) = " << std::abs( fnorm ) << "\n";
+#endif
+	if( tol < std::abs( fnorm ) ) {
+		std::cout << "The Frobenius norm is too large: " << std::abs( fnorm ) << ".\n";
+		return FAILED;
+	}
+
+	return rc;
+}
+
+
+//** check solution by calculating A x Q - Q x diag(d) */
+template<
+	typename D,
+	typename SymmOrHermTridiagonalType,
+	typename OrthogonalType,
+	typename SymmHermTrdiViewType,
+	typename OrthViewType,
+	typename SymmHermTrdiImfR,
+	typename SymmHermTrdiImfC,
+	typename OrthViewImfR,
+	typename OrthViewImfC,
+	typename VecViewType,
+	typename VecImfR,
+	typename VecImfC,
+	class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >,
+	class Minus = operators::subtract< D >,
+	class Divide = operators::divide< D >
+>
+RC check_solution(
+	Matrix< D, SymmOrHermTridiagonalType, Dense, SymmHermTrdiViewType, SymmHermTrdiImfR, SymmHermTrdiImfC > &T,
+	Matrix<	D, OrthogonalType, Dense, OrthViewType, OrthViewImfR, OrthViewImfC > &Q,
+	Vector<	D, structures::General, Dense, VecViewType, VecImfR, VecImfC > &d,
+	const Ring & ring = Ring(),
+	const Minus & minus = Minus(),
+	const Divide & divide = Divide()
+) {
+	(void)ring;
+	(void)minus;
+	(void)divide;
+	RC rc = SUCCESS;
+
+ 	const size_t n = nrows( Q );
+
+#ifdef DEBUG
+	print_matrix( " T ", T  );
+	print_matrix( " Q ", Q  );
+	print_vector( " d ", d  );
+#endif
+
+	alp::Matrix< D, alp::structures::Square, alp::Density::Dense > Left( n );
+	alp::Matrix< D, alp::structures::Square, alp::Density::Dense > Right( n );
+	alp::Matrix< D, alp::structures::Square, alp::Density::Dense > Dmat( n );
+	const Scalar< D > zero( ring.template getZero< D >() );
+	const Scalar< D > one( ring.template getOne< D >() );
+
+	rc = rc ? rc : set( Left, zero );
+	rc = rc ? rc : mxm( Left, T, Q, ring );
+
+	rc = rc ? rc : set( Dmat, zero );
+	auto D_diag = alp::get_view< alp::view::diagonal >( Dmat );
+	rc = rc ? rc : set( D_diag, d );
+	rc = rc ? rc : set( Right, zero );
+	rc = rc ? rc : mxm( Right, Q, Dmat, ring );
+#ifdef DEBUG
+	print_matrix( " TxQ ", Left  );
+	print_matrix( " QxD ", Right  ),
+#endif
+	rc = rc ? rc : foldl( Left, Right, minus );
+
+	//Frobenius norm
+	D fnorm = ring.template getZero< D >();
+	rc = rc ? rc : alp::eWiseLambda(
+		[ &fnorm, &ring ]( const size_t i, const size_t j, D &val ) {
+			(void) i;
+			(void) j;
+			internal::foldl( fnorm, val * val, ring.getAdditiveOperator() );
+		},
+		Left
+	);
+	fnorm = std::sqrt( fnorm );
+
+#ifdef DEBUG
+	std::cout << " FrobeniusNorm(AQ-QD) = " << std::abs( fnorm ) << "\n";
+#endif
+	if( tol < std::abs( fnorm ) ) {
+		std::cout << "The Frobenius norm is too large: " << std::abs( fnorm ) << ".\n";
+		return FAILED;
+	}
+
+	return rc;
+}
 
 
 
@@ -281,12 +257,7 @@ void alp_program( const size_t & unit, alp::RC & rc ) {
 	print_matrix( " input matrix T ", T );
 #endif
 
-  	rc = rc ? rc : algorithms::symm_tridiag_dac_eigensolver(
-		T,
-		Q,
-		d,
-		ring
-	);
+  	rc = rc ? rc : algorithms::symm_tridiag_dac_eigensolver( T, Q, d, ring );
 
 
 #ifdef DEBUG
@@ -294,15 +265,20 @@ void alp_program( const size_t & unit, alp::RC & rc ) {
 	print_matrix( " << T >> ", T );
 #endif
 
-// 	rc = check_overlap( Q );
-// 	if( rc != SUCCESS ) {
-// 		std::cout << "Error: mratrix Q is not orthogonal\n";
-// 	}
+	// the algorithm should return correct eigenvalues
+	// but for larger matrices (n>20) a more stable calculations
+	// of eigenvectors is needed
+	// therefore we disable numerical correctness check in this version
+
+	// rc = check_overlap( Q );
+	// if( rc != SUCCESS ) {
+	// 	std::cout << "Error: mratrix Q is not orthogonal\n";
+	// }
 
-// 	rc = check_solution( H, Q, T );
-// 	if( rc != SUCCESS ) {
-// 		std::cout << "Error: solution numerically wrong\n";
-// 	}
+	// rc = check_solution( T, Q, d );
+	// if( rc != SUCCESS ) {
+	// 	std::cout << "Error: solution numerically wrong\n";
+	// }
 }
 
 int main( int argc, char ** argv ) {

From b5ea85091b3fc90b5178c77f7ef7e0554e2a77c7 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Thu, 20 Oct 2022 14:42:07 +0200
Subject: [PATCH 08/14] replace for loop with ALP primitives

(fold Matrix -> vector is missing)
---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 52 +++++++++++++------
 1 file changed, 35 insertions(+), 17 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index f6d7d3888..4e7e387ed 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -252,23 +252,41 @@ namespace alp {
 			);
 			rc = rc ? rc : alp::set( egvals_non_direct, vec_temp_egvals );
 
-			// until fold vec -> matrix (or scatter) is implemented
-			// we have to use this for loop
-			for( size_t i = 0; i < nn; i++ ) {
-				auto egvecs_view = get_view( Egvecs_non_direct, utils::range( 0, nn ), i );
-				// //test
-				// alp::set( egvecs_view, Scalar< D >( i + 1 ) );
-				// //test
-
-				alp::set( egvecs_view, vec_temp_v );
-				alp::set( vec_temp_egvals, vec_temp_d );
-				Scalar< D > lambda_i( egvals_non_direct[ i ] );
-				rc = rc ? rc : alp::foldl( vec_temp_egvals, lambda_i , minus );
-				rc = rc ? rc : alp::foldl( egvecs_view, vec_temp_egvals , divide );
-				Scalar< D > norm1( zero );
-				rc = rc ? rc : norm2( norm1, egvecs_view, ring );
-				rc = rc ? rc : alp::foldl( egvecs_view, norm1 , divide );
-			}
+			Matrix< D, structures::General, Dense > tmp_egvecs( nn, nn );
+			Matrix< D, structures::General, Dense > tmp_denominator( nn, nn );
+
+			alp::Vector< D > ones( nn );
+			rc = rc ? rc : alp::set( ones, one );
+			rc = rc ? rc : alp::set(
+				tmp_egvecs,
+				alp::outer( vec_temp_v, ones, ring.getMultiplicativeOperator() )
+			);
+
+			auto ddd = alp::outer( vec_temp_d, ones, ring.getMultiplicativeOperator() );
+			auto lll = alp::outer( ones, egvals_non_direct, ring.getMultiplicativeOperator() );
+			rc = rc ? rc : alp::set( tmp_denominator, ddd );
+			rc = rc ? rc : alp::foldl( tmp_denominator, lll, minus );
+			rc = rc ? rc : alp::foldl( tmp_egvecs, tmp_denominator, divide );
+
+			// while fold matrix -> vector would be a solution to
+			// normalize columns in tmp_egvecs,
+			// here we abuse syntax and use eWiseLambda.
+			// Once fold matrix -> vector implemented, the next section should be rewritten
+			rc = rc ? rc : eWiseLambda(
+				[ &tmp_egvecs, &nn, &ring, &divide, &zero ]( const size_t i, D &val ) {
+					(void)val;
+					auto egvec_i = get_view( tmp_egvecs, utils::range( 0, nn ), i );
+					Scalar< D > norm_i( zero );
+					(void)norm2( norm_i, egvec_i, ring );
+					alp::foldl( egvec_i, norm_i , divide );
+				},
+				ones
+			);
+
+			// update results
+			auto egvecs_view = get_view( Egvecs_non_direct, utils::range( 0, nn ), utils::range( 0, nn ) );
+			auto tmp_egvecs_orth_view = get_view< OrthogonalType  >( tmp_egvecs );
+			rc = rc ? rc : alp::set( egvecs_view, tmp_egvecs_orth_view );
 
 			return rc;
 		}

From e3f0b09249786a9ec770e0c116cf7ac19f1f74f9 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Fri, 21 Oct 2022 10:21:47 +0200
Subject: [PATCH 09/14] comments

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 21 +++++++++----------
 1 file changed, 10 insertions(+), 11 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index 4e7e387ed..f6bd85caa 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -51,7 +51,8 @@ namespace alp {
 		RC bisec_sec_eq(
 			Scalar< D > &lambda,
 			const Vector<	D, structures::General,	Dense, VecView1, VecImfR1, VecImfC1 > &d,
-			// Vector v should be const, but that would disable eWiseLambda, to be resolved in the future
+			// Vector v should be const, but that would disable eWiseLambda,
+			// to be resolved in the future
 			Vector<	D, structures::General,	Dense, VecView2, VecImfR2, VecImfC2 > &v,
 			const Scalar< D > &a,
 			const Scalar< D > &b,
@@ -158,7 +159,9 @@ namespace alp {
 
 			std::vector< size_t > direct_egvc_indx( n, 0 );
 			std::vector< size_t > non_direct_egvc_indx( n, 0 );
-
+			// the following loop should be replaced by ALP primitives
+			// since v is not sorted it seems that another sort is needed
+			// currently there is no simple way to impement this in ALP
 			for( size_t i = 0; i < n; i++ ) {
 				if( std::abs( v[ i ] ) < eps ) {
 					// in these cases equals are canonical vectors
@@ -187,10 +190,6 @@ namespace alp {
 			auto egvals_direct = get_view< alp::structures::General >( egvals, select_direct );
 			auto egvals_non_direct = get_view< alp::structures::General >( egvals, select_non_direct );
 
-			// not needed as Q is alrady set to identity
-			// auto Egvecs_direct = alp::get_view< alp::structures::Orthogonal >(
-			// 	Egvecs, select_direct, select_direct
-			// );
 			auto Egvecs_non_direct = alp::get_view< alp::structures::Orthogonal >(
 				Egvecs, select_non_direct, select_non_direct
 			);
@@ -222,8 +221,8 @@ namespace alp {
 			rc = rc ? rc : alp::set( v3, v4 );
 
 			// eWiseLambda currently does not work with select view
-			// dot does not work with select view
-			// as a temp solutions we make temp vectors 
+			// dot() does not work with select view
+			// as a (temp) solution we use temp vectors
 			alp::Vector< D > vec_temp_egvals( nn );
 			alp::Vector< D > vec_temp_d( nn );
 			alp::Vector< D > vec_temp_v( nn );
@@ -233,13 +232,13 @@ namespace alp {
 			rc = rc ? rc : alp::set( vec_temp_v, v_view );
 
 			Scalar< D > alpha( zero );
-			//rc = rc ? rc : dot( alpha, d_view, d_view, ring ); // bug!
+			// there is a bug in dot() when called on select views
+			//rc = rc ? rc : dot( alpha, d_view, d_view, ring );
 			rc = rc ? rc : dot( alpha, vec_temp_v, vec_temp_v, ring );
 
 			auto v5 = get_view( vec_b, utils::range( alp::getLength( vec_b ) - 1, alp::getLength( vec_b ) ) );
 			rc = rc ? rc : alp::foldl( v5, alpha, ring.getAdditiveOperator() );
 
-
 			rc = rc ? rc : eWiseLambda(
 				[ &d_view, &vec_temp_v, &vec_b ]( const size_t i, D &val ) {
 					Scalar< D > a( d_view[ i ] );
@@ -270,7 +269,7 @@ namespace alp {
 
 			// while fold matrix -> vector would be a solution to
 			// normalize columns in tmp_egvecs,
-			// here we abuse syntax and use eWiseLambda.
+			// here we abuse the syntax and use eWiseLambda.
 			// Once fold matrix -> vector implemented, the next section should be rewritten
 			rc = rc ? rc : eWiseLambda(
 				[ &tmp_egvecs, &nn, &ring, &divide, &zero ]( const size_t i, D &val ) {

From a54cbdbaeca39ce5d27193e29820a3d720a7f3b8 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Fri, 21 Oct 2022 10:44:53 +0200
Subject: [PATCH 10/14] enable smoketest

---
 tests/smoke/CMakeLists.txt | 2 +-
 tests/smoke/smoketests.sh  | 7 +++++++
 2 files changed, 8 insertions(+), 1 deletion(-)

diff --git a/tests/smoke/CMakeLists.txt b/tests/smoke/CMakeLists.txt
index 16200d0fc..c64dd42be 100644
--- a/tests/smoke/CMakeLists.txt
+++ b/tests/smoke/CMakeLists.txt
@@ -185,7 +185,7 @@ add_grb_executables( alp_zgeqrf_complex alp_zgeqrf.cpp
 	COMPILE_DEFINITIONS _COMPLEX
 )
 
-add_grb_executables( alp_stedc alp_stedc.cpp
+add_grb_executables( alp_dstedc alp_stedc.cpp
         BACKENDS alp_reference
 )
 
diff --git a/tests/smoke/smoketests.sh b/tests/smoke/smoketests.sh
index f2fab6b57..bf2e69cd6 100755
--- a/tests/smoke/smoketests.sh
+++ b/tests/smoke/smoketests.sh
@@ -571,6 +571,13 @@ for BACKEND in ${BACKENDS[@]}; do
 	grep 'Test OK' ${TEST_OUT_DIR}/alp_zgeqrf_complex_${BACKEND}.log || echo "Test FAILED"
 	echo " "
 
+	NTEST_DIVCON=100
+	echo ">>>      [x]           [ ]       Tests dstedc (Divide and conquer tridiagonal eigensolver) on"
+	echo ">>>                               a tridiagonal real symmetric matrix (${NTEST_DIVCON}x${NTEST_DIVCON})."
+	bash -c "$runner ${TEST_BIN_DIR}/alp_dstedc_${BACKEND} ${NTEST_DIVCON} &> ${TEST_OUT_DIR}/alp_dstedc_${BACKEND}.log"
+	head -1 ${TEST_OUT_DIR}/alp_dstedc_${BACKEND}.log
+	grep 'Test OK' ${TEST_OUT_DIR}/alp_dstedc_${BACKEND}.log || echo "Test FAILED"
+	echo " "
 	
 done
 

From c360f45fd617237f1e2abbcaf89e722f5fdc7490 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Fri, 21 Oct 2022 14:17:38 +0200
Subject: [PATCH 11/14] review

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 99 +++++++++----------
 include/alp/structures.hpp                    |  6 +-
 tests/smoke/alp_stedc.cpp                     | 23 +++--
 3 files changed, 63 insertions(+), 65 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index f6bd85caa..95158ecc2 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -34,7 +34,7 @@ namespace alp {
 		 * find zero of secular equation in interval <a,b>
 		 * using bisection
 		 * this is not an optimal algorithm and there are many
-		 * more efficient implantation
+		 * more efficient implementation
 		 */
 		template<
 			typename D,
@@ -78,10 +78,10 @@ namespace alp {
 				[ &d, &x0, &fx0, &ring, &minus, &divide ]( const size_t i, D &val ) {
 					Scalar< D > alpha( val );
 					Scalar< D > beta( d[ i ] );
-					foldl( alpha, Scalar< D > ( val ), ring.getMultiplicativeOperator() );
-					foldl( beta, x0, minus );
-					foldl( alpha, beta, divide );
-					foldl( fx0, alpha, ring.getAdditiveOperator() );
+					alp::foldl( alpha, Scalar< D > ( val ), ring.getMultiplicativeOperator() );
+					alp::foldl( beta, x0, minus );
+					alp::foldl( alpha, beta, divide );
+					alp::foldl( fx0, alpha, ring.getAdditiveOperator() );
 				},
 				v
 			);
@@ -102,13 +102,13 @@ namespace alp {
 
 
 		/**
-		 * Calcualte eigendecomposition of system D + vvt
+		 * Calculate eigendecomposition of system D + vvt
 		 *        \f$D = diag(d)$ is diagonal matrix and
 		 *        \a vvt outer product outer(v,v)
 		 *
 		 * @tparam D        Data element type
 		 * @tparam Ring     Type of the semiring used in the computation
-		 * @tparam Minus    Type minus operator used in the computation
+		 * @tparam Minus    Type of minus operator used in the computation
 		 * @tparam Divide   Type of divide operator used in the computation
 		 * @param[out] Egvecs    output orthogonal matrix contaning eigenvectors
 		 * @param[out] egvals    output vector containg eigenvalues
@@ -144,7 +144,6 @@ namespace alp {
 			const Minus &minus = Minus(),
 			const Divide &divide = Divide()
 		) {
-			(void)minus;
 			RC rc = SUCCESS;
 
 			const Scalar< D > zero( ring.template getZero< D >() );
@@ -187,8 +186,8 @@ namespace alp {
 			std::cout << " ---->     count_direct_egvc = " << count_direct_egvc << "\n";
 			std::cout << " ----> count_non_direct_egvc = " << count_non_direct_egvc << "\n";
 #endif
-			auto egvals_direct = get_view< alp::structures::General >( egvals, select_direct );
-			auto egvals_non_direct = get_view< alp::structures::General >( egvals, select_non_direct );
+			auto egvals_direct = alp::get_view< alp::structures::General >( egvals, select_direct );
+			auto egvals_non_direct = alp::get_view< alp::structures::General >( egvals, select_non_direct );
 
 			auto Egvecs_non_direct = alp::get_view< alp::structures::Orthogonal >(
 				Egvecs, select_non_direct, select_non_direct
@@ -200,8 +199,8 @@ namespace alp {
 				get_view< alp::structures::General >( d, select_direct )
 			);
 
-			auto d_view = get_view< alp::structures::General >( d, select_non_direct );
-			auto v_view = get_view< alp::structures::General >( v, select_non_direct );
+			auto d_view = alp::get_view< alp::structures::General >( d, select_non_direct );
+			auto v_view = alp::get_view< alp::structures::General >( v, select_non_direct );
 
 #ifdef DEBUG
 			print_vector( "eigensolveDiagPlusOuter: d ", d );
@@ -213,11 +212,11 @@ namespace alp {
 			// vec_b = {d_view[1], d_view[2], ... , d_view[N-1], d_view[N]+dot(v,v) }
 			size_t nn = alp::getLength( d_view );
 			alp::Vector< D > vec_b( nn );
-			auto v1 = get_view( vec_b, utils::range( 0, nn - 1 ) );
-			auto v2 = get_view( d_view, utils::range( 1, nn ) );
+			auto v1 = alp::get_view( vec_b, utils::range( 0, nn - 1 ) );
+			auto v2 = alp::get_view( d_view, utils::range( 1, nn ) );
 			rc = rc ? rc : alp::set( v1, v2 );
-			auto v3 = get_view( vec_b, utils::range( nn - 1, nn ) );
-			auto v4 = get_view( d_view, utils::range( nn - 1, nn ) );
+			auto v3 = alp::get_view( vec_b, utils::range( nn - 1, nn ) );
+			auto v4 = alp::get_view( d_view, utils::range( nn - 1, nn ) );
 			rc = rc ? rc : alp::set( v3, v4 );
 
 			// eWiseLambda currently does not work with select view
@@ -233,13 +232,13 @@ namespace alp {
 
 			Scalar< D > alpha( zero );
 			// there is a bug in dot() when called on select views
-			//rc = rc ? rc : dot( alpha, d_view, d_view, ring );
-			rc = rc ? rc : dot( alpha, vec_temp_v, vec_temp_v, ring );
+			//rc = rc ? rc : alp::dot( alpha, d_view, d_view, ring );
+			rc = rc ? rc : alp::dot( alpha, vec_temp_v, vec_temp_v, ring );
 
-			auto v5 = get_view( vec_b, utils::range( alp::getLength( vec_b ) - 1, alp::getLength( vec_b ) ) );
+			auto v5 = alp::get_view( vec_b, utils::range( alp::getLength( vec_b ) - 1, alp::getLength( vec_b ) ) );
 			rc = rc ? rc : alp::foldl( v5, alpha, ring.getAdditiveOperator() );
 
-			rc = rc ? rc : eWiseLambda(
+			rc = rc ? rc : alp::eWiseLambda(
 				[ &d_view, &vec_temp_v, &vec_b ]( const size_t i, D &val ) {
 					Scalar< D > a( d_view[ i ] );
 					Scalar< D > b( vec_b[ i ] );
@@ -271,20 +270,20 @@ namespace alp {
 			// normalize columns in tmp_egvecs,
 			// here we abuse the syntax and use eWiseLambda.
 			// Once fold matrix -> vector implemented, the next section should be rewritten
-			rc = rc ? rc : eWiseLambda(
+			rc = rc ? rc : alp::eWiseLambda(
 				[ &tmp_egvecs, &nn, &ring, &divide, &zero ]( const size_t i, D &val ) {
-					(void)val;
+					(void) val;
 					auto egvec_i = get_view( tmp_egvecs, utils::range( 0, nn ), i );
 					Scalar< D > norm_i( zero );
-					(void)norm2( norm_i, egvec_i, ring );
+					alp::norm2( norm_i, egvec_i, ring );
 					alp::foldl( egvec_i, norm_i , divide );
 				},
 				ones
 			);
 
 			// update results
-			auto egvecs_view = get_view( Egvecs_non_direct, utils::range( 0, nn ), utils::range( 0, nn ) );
-			auto tmp_egvecs_orth_view = get_view< OrthogonalType  >( tmp_egvecs );
+			auto egvecs_view = alp::get_view( Egvecs_non_direct, utils::range( 0, nn ), utils::range( 0, nn ) );
+			auto tmp_egvecs_orth_view = alp::get_view< OrthogonalType >( tmp_egvecs );
 			rc = rc ? rc : alp::set( egvecs_view, tmp_egvecs_orth_view );
 
 			return rc;
@@ -292,7 +291,7 @@ namespace alp {
 
 
 		/**
-		 * Calcualte eigendecomposition of symmetric tridiagonal matrix T
+		 * Calculate eigendecomposition of symmetric tridiagonal matrix T
 		 *        \f$T = Qdiag(d)Q^T\f$ where
 		 *        \a T is real symmetric tridiagonal
 		 *        \a Q is orthogonal (columns are eigenvectors).
@@ -300,7 +299,7 @@ namespace alp {
 		 *
 		 * @tparam D        Data element type
 		 * @tparam Ring     Type of the semiring used in the computation
-		 * @tparam Minus    Type minus operator used in the computation
+		 * @tparam Minus    Type of minus operator used in the computation
 		 * @tparam Divide   Type of divide operator used in the computation
 		 * @param[out] Q    output orthogonal matrix contaning eigenvectors
 		 * @param[out] d    output vector containg eigenvalues
@@ -351,13 +350,13 @@ namespace alp {
 				VecImfR,
 				VecImfC
 			> &d,
-			const Ring & ring = Ring(),
-			const Minus & minus = Minus(),
-			const Divide & divide = Divide()
+			const Ring &ring = Ring(),
+			const Minus &minus = Minus(),
+			const Divide &divide = Divide()
 		) {
-			(void)ring;
-			(void)minus;
-			(void)divide;
+			(void) ring;
+			(void) minus;
+			(void) divide;
 
 			const Scalar< D > zero( ring.template getZero< D >() );
 			const Scalar< D > one( ring.template getOne< D >() );
@@ -369,7 +368,7 @@ namespace alp {
 
 			if( n == 1 ) {
 				//d=T[0];
-				rc = rc ? rc : eWiseLambda(
+				rc = rc ? rc : alp::eWiseLambda(
 					[ &d ]( const size_t i, const size_t j, D &val ) {
 						(void) i;
 						(void) j;
@@ -385,13 +384,13 @@ namespace alp {
 
 
 			Vector< D, structures::General, Dense > v( n );
-			rc = rc ? rc : set( v, zero );
-			rc = rc ? rc : eWiseLambda(
+			rc = rc ? rc : alp::set( v, zero );
+			rc = rc ? rc : alp::eWiseLambda(
 				[ &T, &m, &ring ]( const size_t i, D &val ) {
-					if( i ==  m - 1 ) {
+					if( i == m - 1 ) {
 						val = ring.template getOne< D >();
 					}
-					if( i ==  m) {
+					if( i == m) {
 						val = internal::access( T, internal::getStorageIndex( T, m - 1, m ) );
 					}
 				},
@@ -413,8 +412,8 @@ namespace alp {
 			print_matrix( " Atmp(updated)  ", Atmp );
 #endif
 
-			auto Ttop = get_view< SymmOrHermTridiagonalType >( Atmp, utils::range( 0, m ), utils::range( 0, m ) );
-			auto Tdown = get_view< SymmOrHermTridiagonalType >( Atmp, utils::range( m, n ), utils::range( m, n ) );
+			auto Ttop = alp::get_view< SymmOrHermTridiagonalType >( Atmp, utils::range( 0, m ), utils::range( 0, m ) );
+			auto Tdown = alp::get_view< SymmOrHermTridiagonalType >( Atmp, utils::range( m, n ), utils::range( m, n ) );
 
 #ifdef DEBUG
 			print_matrix( " Ttop = ", Ttop );
@@ -423,14 +422,14 @@ namespace alp {
 
 			Vector< D, structures::General, Dense > dtmp( n );
 			rc = rc ? rc : alp::set( dtmp, zero );
-			auto dtop = get_view( dtmp, utils::range( 0, m ) );
-			auto ddown = get_view( dtmp, utils::range( m, n ) );
+			auto dtop = alp::get_view( dtmp, utils::range( 0, m ) );
+			auto ddown = alp::get_view( dtmp, utils::range( m, n ) );
 
 			Matrix< D, OrthogonalType, Dense > U( n );
 			rc = rc ? rc : alp::set( U, zero );
 
-			auto Utop = get_view< OrthogonalType >( U, utils::range( 0, m ), utils::range( 0, m ) );
-			auto Udown = get_view< OrthogonalType >( U, utils::range( m, n ), utils::range( m, n ) );
+			auto Utop = alp::get_view< OrthogonalType >( U, utils::range( 0, m ), utils::range( 0, m ) );
+			auto Udown = alp::get_view< OrthogonalType >( U, utils::range( m, n ), utils::range( m, n ) );
 
 			rc = rc ? rc : symm_tridiag_dac_eigensolver( Ttop, Utop, dtop, ring );
 			rc = rc ? rc : symm_tridiag_dac_eigensolver( Tdown, Udown, ddown, ring );
@@ -454,9 +453,9 @@ namespace alp {
 #ifdef TEMPDISABLE
 			// while mxv does not support vectors/view
 			// we cast vector->matrix and use mxm
-			auto z_mat_view = get_view< view::matrix >( z );
-			auto v_mat_view = get_view< view::matrix >( v );
-			rc = rc ? rc : mxm(
+			auto z_mat_view = alp::get_view< view::matrix >( z );
+			auto v_mat_view = alp::get_view< view::matrix >( v );
+			rc = rc ? rc : alp::mxm(
 				z_mat_view,
 				alp::get_view< alp::view::transpose >( U ),
 				v_mat_view,
@@ -464,7 +463,7 @@ namespace alp {
 			);
 #else
 			//z=U^T.dot(v)
-			rc = rc ? rc : mxv(
+			rc = rc ? rc : alp::mxv(
 				z,
 				alp::get_view< alp::view::transpose >( U ),
 				v,
@@ -480,7 +479,7 @@ namespace alp {
 			// permutations which sort dtmp
 			std::vector< size_t > isort_dtmp( n, 0 );
 			std::vector< size_t > no_permute_data( n, 0 );
-			for( size_t i = 0 ; i < n ; ++i ) {
+			for( size_t i = 0; i < n; ++i ) {
 				isort_dtmp[ i ] = i;
 				no_permute_data[ i ] = i;
 			}
@@ -531,7 +530,7 @@ namespace alp {
 #endif
 
 			rc = rc ? rc : alp::set( Q, zero );
-			rc = rc ? rc : mxm( Q, U, QdOuter, ring	);
+			rc = rc ? rc : alp::mxm( Q, U, QdOuter, ring	);
 
 #ifdef DEBUG
 			print_matrix( "  Q = U x Q   ", Q );
diff --git a/include/alp/structures.hpp b/include/alp/structures.hpp
index 93a51662a..363e8e533 100644
--- a/include/alp/structures.hpp
+++ b/include/alp/structures.hpp
@@ -633,9 +633,9 @@ namespace alp {
 		struct isInstantiable< Orthogonal, Orthogonal > {
 			template< typename ImfR, typename ImfC >
 			static bool check( const ImfR &imf_r, const ImfC &imf_c ) {
-				// This chek has to further improved.
-				// Orthogonal matrix in the current implemenation
-				// means full-rank square othogonal matrix.
+				// This check has to be further improved.
+				// Orthogonal matrix in the current implementation
+				// means full-rank square orthogonal matrix.
 				// Rectangular matrix orthogonal only by rows (or columns)
 				// does not fit into the current Orthogonal structure.
 				return imf_r.n == imf_c.n ;
diff --git a/tests/smoke/alp_stedc.cpp b/tests/smoke/alp_stedc.cpp
index 0f6d9b6a5..09df2e8df 100644
--- a/tests/smoke/alp_stedc.cpp
+++ b/tests/smoke/alp_stedc.cpp
@@ -41,8 +41,8 @@ using HermitianOrSymmetric = structures::Symmetric;
 constexpr BaseScalarType tol = 1.e-5;
 constexpr size_t RNDSEED = 11235;
 
-//temp function untill (tridiagonal)Hermitian containter is implemented
-//** gnerate tridiagonal-symmetric-hermitian matrix in a rectangular container */
+//** temp function until (tridiagonal)Hermitian container is implemented */
+//** generate tridiagonal-symmetric-hermitian matrix in a rectangular container */
 template<
 	typename T
 >
@@ -54,8 +54,7 @@ std::vector< T > generate_symmherm_tridiag_matrix_data(
 	>::type * const = nullptr
 ) {
 	std::vector< T > data( N * N );
-	std::fill(data.begin(), data.end(), static_cast< T >( 0 ) );
-	std::srand( RNDSEED );
+	std::fill( data.begin(), data.end(), static_cast< T >( 0 ) );
 	for( size_t i = 0; i < N; ++i ) {
 		for( size_t j = i; ( j < N ) && ( j <= i + 1 ); ++j ) {
 			T val( std::rand(), std::rand() );
@@ -78,7 +77,6 @@ std::vector< T >  generate_symmherm_tridiag_matrix_data(
 	>::type * const = nullptr
 ) {
 	std::vector< T > data( N * N );
-	std::srand( RNDSEED );
 	for( size_t i = 0; i < N; ++i ) {
 		for( size_t j = i; ( j < N ) && ( j <= i + 1 ); ++j ) {
 			T val = static_cast< T >( std::rand() )  / RAND_MAX;
@@ -169,13 +167,13 @@ RC check_solution(
 	Matrix< D, SymmOrHermTridiagonalType, Dense, SymmHermTrdiViewType, SymmHermTrdiImfR, SymmHermTrdiImfC > &T,
 	Matrix<	D, OrthogonalType, Dense, OrthViewType, OrthViewImfR, OrthViewImfC > &Q,
 	Vector<	D, structures::General, Dense, VecViewType, VecImfR, VecImfC > &d,
-	const Ring & ring = Ring(),
-	const Minus & minus = Minus(),
-	const Divide & divide = Divide()
+	const Ring &ring = Ring(),
+	const Minus &minus = Minus(),
+	const Divide &divide = Divide()
 ) {
-	(void)ring;
-	(void)minus;
-	(void)divide;
+	(void) ring;
+	(void) minus;
+	(void) divide;
 	RC rc = SUCCESS;
 
  	const size_t n = nrows( Q );
@@ -231,7 +229,7 @@ RC check_solution(
 
 
 
-void alp_program( const size_t & unit, alp::RC & rc ) {
+void alp_program( const size_t &unit, alp::RC &rc ) {
 	rc = SUCCESS;
 
 	alp::Semiring<
@@ -250,6 +248,7 @@ void alp_program( const size_t & unit, alp::RC & rc ) {
 	Vector< ScalarType, structures::General, Dense > d( N );
 	rc = rc ? rc : set( d, zero_scalar );
 	{
+		std::srand( RNDSEED );
 		auto matrix_data = generate_symmherm_tridiag_matrix_data< ScalarType >( N );
 		rc = rc ? rc : alp::buildMatrix( T, matrix_data.begin(), matrix_data.end() );
 	}

From 97c1b64fb8a3ef5c1f76f3c17bb23d46a15e9de7 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Fri, 21 Oct 2022 17:07:16 +0200
Subject: [PATCH 12/14] review

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 36 +++++++++++--------
 1 file changed, 21 insertions(+), 15 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index 95158ecc2..3de7358f9 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -65,9 +65,16 @@ namespace alp {
 
 			const Scalar< D > zero( ring.template getZero< D >() );
 			const Scalar< D > one( ring.template getOne< D >() );
-			Scalar< D > x0( ( *a + *b ) / ( 2 ) );
 
-			if( std::abs( *a - *b ) < tol ) {
+			Scalar< D > x0( a );
+			rc = rc ? rc : alp::foldl( x0, b, ring.getAdditiveOperator() );
+			rc = rc ? rc : alp::foldl( x0, Scalar< D >( 2 ), divide );
+
+			Scalar< D > delta( a );
+			rc = rc ? rc : alp::foldl( delta, b, minus );
+			*delta = std::abs( *delta );
+
+			if( *delta < tol ) {
 				alp::set( lambda, x0 );
 				return rc;
 			}
@@ -239,10 +246,12 @@ namespace alp {
 			rc = rc ? rc : alp::foldl( v5, alpha, ring.getAdditiveOperator() );
 
 			rc = rc ? rc : alp::eWiseLambda(
-				[ &d_view, &vec_temp_v, &vec_b ]( const size_t i, D &val ) {
+				[ &d_view, &vec_temp_v, &vec_b, &ring, &divide ]( const size_t i, D &val ) {
 					Scalar< D > a( d_view[ i ] );
 					Scalar< D > b( vec_b[ i ] );
-					Scalar< D > w( ( *a + *b ) / 2 );
+					Scalar< D > w( a );
+					alp::foldl( w, b, ring.getAdditiveOperator() );
+					alp::foldl( w, Scalar< D >( 2 ), divide );
 					bisec_sec_eq( w, d_view, vec_temp_v, a, b );
 					val = *w;
 				},
@@ -385,17 +394,14 @@ namespace alp {
 
 			Vector< D, structures::General, Dense > v( n );
 			rc = rc ? rc : alp::set( v, zero );
-			rc = rc ? rc : alp::eWiseLambda(
-				[ &T, &m, &ring ]( const size_t i, D &val ) {
-					if( i == m - 1 ) {
-						val = ring.template getOne< D >();
-					}
-					if( i == m) {
-						val = internal::access( T, internal::getStorageIndex( T, m - 1, m ) );
-					}
-				},
-				v
-			);
+
+			auto v1 = alp::get_view( T, utils::range( m - 1, m ), m );
+			auto v2 = alp::get_view( v, utils::range( m , m + 1 ) );
+			rc = rc ? rc : alp::set( v2, v1 );
+
+			auto v3 = alp::get_view( v, utils::range( m - 1 , m ) );
+			rc = rc ? rc : alp::set( v3, one );
+
 #ifdef DEBUG
 			print_vector( " v = ", v );
 #endif

From 44ad6c686cfebbe9836c26878b0b427af489f414 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Mon, 24 Oct 2022 10:51:13 +0200
Subject: [PATCH 13/14] review

---
 .../algorithms/symm_tridiag_eigensolver.hpp   | 54 +++++++++----------
 1 file changed, 25 insertions(+), 29 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index 3de7358f9..4064054a0 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -38,22 +38,22 @@ namespace alp {
 		 */
 		template<
 			typename D,
-			typename VecView1,
-			typename VecImfR1,
-			typename VecImfC1,
-			typename VecView2,
-			typename VecImfR2,
-			typename VecImfC2,
+			typename VectorD,
+			typename VectorV,
 			class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >,
 			class Minus = operators::subtract< D >,
-			class Divide = operators::divide< D >
+			class Divide = operators::divide< D >,
+			std::enable_if_t<
+				is_vector< VectorD >::value &&
+				is_vector< VectorV >::value
+			> * = nullptr
 		>
 		RC bisec_sec_eq(
 			Scalar< D > &lambda,
-			const Vector<	D, structures::General,	Dense, VecView1, VecImfR1, VecImfC1 > &d,
+			const VectorD &d,
 			// Vector v should be const, but that would disable eWiseLambda,
 			// to be resolved in the future
-			Vector<	D, structures::General,	Dense, VecView2, VecImfR2, VecImfC2 > &v,
+			VectorV &v,
 			const Scalar< D > &a,
 			const Scalar< D > &b,
 			const D tol = 1.e-10,
@@ -124,29 +124,25 @@ namespace alp {
 		 *
 		 */
 		template<
-			typename D,
-			typename VecView1,
-			typename VecImfR1,
-			typename VecImfC1,
-			typename VecView2,
-			typename VecImfR2,
-			typename VecImfC2,
-			typename VecView3,
-			typename VecImfR3,
-			typename VecImfC3,
-			typename OrthogonalType,
-			typename OrthViewType,
-			typename OrthViewImfR,
-			typename OrthViewImfC,
-			class Ring = Semiring< operators::add< D >, operators::mul< D >, identities::zero, identities::one >,
+			typename Vec1,
+			typename Vec2,
+			typename Vec3,
+			typename OrthogonalMat,
+			typename D = typename OrthogonalMat::value_type,
+			class Ring = Semiring<
+				operators::add< D >,
+				operators::mul< D >,
+				identities::zero,
+				identities::one
+			>,
 			class Minus = operators::subtract< D >,
 			class Divide = operators::divide< D >
 		>
 		RC eigensolveDiagPlusOuter(
-			Vector<	D, structures::General,	Dense, VecView1, VecImfR1, VecImfC1 > &egvals,
-			Matrix< D, OrthogonalType, Dense, OrthViewType, OrthViewImfR, OrthViewImfC > &Egvecs,
-			Vector<	D, structures::General, Dense, VecView2, VecImfR2, VecImfC2 > &d,
-			Vector< D, structures::General, Dense, VecView3, VecImfR3, VecImfC3 > &v,
+			Vec1 &egvals,
+			OrthogonalMat &Egvecs,
+			Vec2 &d,
+			Vec3 &v,
 			const Ring &ring = Ring(),
 			const Minus &minus = Minus(),
 			const Divide &divide = Divide()
@@ -292,7 +288,7 @@ namespace alp {
 
 			// update results
 			auto egvecs_view = alp::get_view( Egvecs_non_direct, utils::range( 0, nn ), utils::range( 0, nn ) );
-			auto tmp_egvecs_orth_view = alp::get_view< OrthogonalType >( tmp_egvecs );
+			auto tmp_egvecs_orth_view = alp::get_view< typename OrthogonalMat::structure >( tmp_egvecs );
 			rc = rc ? rc : alp::set( egvecs_view, tmp_egvecs_orth_view );
 
 			return rc;

From 8e0aeb63364b26da69c68ebbb96ce28a74688a96 Mon Sep 17 00:00:00 2001
From: Denis Jelovina <denis.jelovina@huawei.com>
Date: Mon, 24 Oct 2022 11:34:40 +0200
Subject: [PATCH 14/14] review

---
 include/alp/algorithms/symm_tridiag_eigensolver.hpp | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/include/alp/algorithms/symm_tridiag_eigensolver.hpp b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
index 4064054a0..f76d91fff 100644
--- a/include/alp/algorithms/symm_tridiag_eigensolver.hpp
+++ b/include/alp/algorithms/symm_tridiag_eigensolver.hpp
@@ -124,9 +124,9 @@ namespace alp {
 		 *
 		 */
 		template<
-			typename Vec1,
-			typename Vec2,
-			typename Vec3,
+			typename VectorEgVals,
+			typename VectorD,
+			typename VectorV,
 			typename OrthogonalMat,
 			typename D = typename OrthogonalMat::value_type,
 			class Ring = Semiring<
@@ -139,10 +139,10 @@ namespace alp {
 			class Divide = operators::divide< D >
 		>
 		RC eigensolveDiagPlusOuter(
-			Vec1 &egvals,
+			VectorEgVals &egvals,
 			OrthogonalMat &Egvecs,
-			Vec2 &d,
-			Vec3 &v,
+			VectorD &d,
+			VectorV &v,
 			const Ring &ring = Ring(),
 			const Minus &minus = Minus(),
 			const Divide &divide = Divide()