cosmotool/src/eskow.hpp

#ifndef __ESKOW_CHOLESKY_HPP
#define __ESKOW_CHOLESKY_HPP

#include <algorithm>
#include <cmath>
#include <iomanip>
#include <iostream>
#include <utility>
#include <vector>
#include "mach.hpp"

/* Implementation of Schnabel & Eskow, "A Revised Modified Cholesky Factorization Algorithm", SIAM J. OPTIM., Vol. 9, No. 4, pp. 1135-1148, 1999. */

/**
 * Modified Cholesky factorization following Schnabel & Eskow (1999).
 *
 * Given a symmetric N x N matrix A, the algorithm produces a lower
 * triangular factor L such that  P A P^T + E = L L^T, where P is a
 * permutation chosen by diagonal pivoting and E is a non-negative diagonal
 * matrix that is zero whenever A is sufficiently positive definite.
 *
 * Template parameters:
 *   T  floating point scalar type.
 *   A  matrix type; m(i,j) must return a reference to element (i,j),
 *      with 0-based indices.
 *
 * Storage convention: apart from the debug printing, only the lower
 * triangle (including the diagonal) of the matrix is read and written.
 * The strict upper triangle is left untouched.
 *
 * The pivoting permutation is applied in place and is not reported to the
 * caller.
 */
template<typename T, typename A>
class CholeskyEskow
{
private:
  // When true, the intermediate matrices and pivoting decisions are traced
  // on std::cout.
  static const bool verbose_eskow = true;

  // Tolerances of the algorithm: tau = eps^(1/3), tau_bar = eps^(2/3) and
  // the relative threshold mu used by the phase one tests.
  T tau, tau_bar, mu;

  /** Dump the full N x N matrix to std::cout (only if verbose_eskow). */
  void print_matrix(A& m, int N)
  {
    if (!verbose_eskow)
      return;

    // Restore the precision afterwards so that tracing does not alter the
    // formatting of whatever the caller prints later.
    const std::streamsize saved_precision = std::cout.precision(5);

    for (int i = 0; i < N; i++)
      {
        for (int j = 0; j < N; j++)
          std::cout << std::setw(6) << m(i,j) << " ";
        std::cout << '\n';
      }
    std::cout << std::endl;

    std::cout.precision(saved_precision);
  }

  /** Largest |m(k,k)| for k in [j, N). Requires j < N. */
  T max_diag(A& m, int j, int N)
  {
    T maxval = std::abs(m(j,j));

    for (int k = j+1; k < N; k++)
      maxval = std::max(maxval, std::abs(m(k,k)));

    return maxval;
  }

  /**
   * Smallest and largest diagonal entries m(k,k) for k in [j, N), together
   * with the first index at which each of them is attained.
   * Requires j < N.
   */
  void minmax_diag(A& m, int j, int N, T& minval, T& maxval, int& i_min, int& i_max)
  {
    i_min = i_max = j;
    minval = maxval = m(j,j);

    for (int k = j+1; k < N; k++)
      {
        const T d = m(k,k);

        // Strict comparisons keep the first index in case of ties.
        if (d > maxval)
          {
            maxval = d;
            i_max = k;
          }
        if (d < minval)
          {
            minval = d;
            i_min = k;
          }
      }
  }

  /**
   * Symmetric interchange of rows/columns p and q, acting on the lower
   * triangle only.
   *
   * Entries of rows p and q located left of column min(p,q) are exchanged
   * as well; when the interchange is used for pivoting at column min(p,q)
   * these are the already computed columns of L, which must follow the
   * permutation.
   */
  void swap_symmetric(A& m, int N, int p, int q)
  {
    if (p == q)
      return;
    if (p > q)
      std::swap(p, q);

    // Part of both rows left of column p.
    for (int c = 0; c < p; c++)
      std::swap(m(p,c), m(q,c));

    std::swap(m(p,p), m(q,q));

    // Column p below the diagonal <-> row q left of the diagonal.
    // m(q,p) maps onto itself.
    for (int r = p+1; r < q; r++)
      std::swap(m(r,p), m(q,r));

    // Remaining part of columns p and q, below row q.
    for (int r = q+1; r < N; r++)
      std::swap(m(r,p), m(r,q));
  }

  T square(T x)
  {
    return x*x;
  }

  /**
   * Smallest diagonal entry the trailing submatrix would have after
   * eliminating column j:  min over i in (j, N) of m(i,i) - m(i,j)^2/m(j,j).
   * Requires j+1 < N and m(j,j) != 0.
   */
  T min_row(A& m, int j, int N)
  {
    const T a = 1/m(j,j);
    T v = m(j+1,j+1) - square(m(j+1,j))*a;

    for (int i = j+2; i < N; i++)
      v = std::min(v, m(i,i) - square(m(i,j))*a);

    return v;
  }

  /** Index in [j, N) of the first largest element of g. Requires j < N. */
  int g_max(const std::vector<T>& g, int j, int N)
  {
    T a = g[j];
    int k = j;

    for (int i = j+1; i < N; i++)
      {
        if (a < g[i])
          {
            a = g[i];
            k = i;
          }
      }
    return k;
  }

  /**
   * One step of the standard Cholesky elimination: turn column j into the
   * j-th column of L and subtract its outer product from the lower triangle
   * of the trailing submatrix. Requires m(j,j) > 0.
   */
  void eliminate_column(A& m, int j, int N)
  {
    const T L_jj = std::sqrt(m(j,j));

    m(j,j) = L_jj;
    for (int i = j+1; i < N; i++)
      {
        m(i,j) /= L_jj;
        // m(k,j) is already scaled for every k <= i at this point.
        for (int k = j+1; k <= i; k++)
          m(i,k) -= m(i,j)*m(k,j);
      }
  }

public:
  CholeskyEskow()
  {
    tau = std::pow(mach_epsilon<T>(), 1./3);
    tau_bar = std::pow(mach_epsilon<T>(), 2./3);
    mu = 0.1;
  }

  /**
   * Factorize the symmetric matrix m in place.
   *
   * @param m       on input the matrix to factorize (lower triangle is
   *                used); on output its lower triangle holds L.
   * @param N       dimension of the matrix. Nothing is done for N <= 0.
   * @param norm_E  on output, the largest value that has been added to the
   *                diagonal (0 if the matrix was factorized unmodified).
   *
   * NOTE(review): a matrix whose diagonal is entirely zero is not treated
   * specially and leads to a division by zero, as in the original code.
   */
  void cholesky(A& m, int N, T& norm_E)
  {
    norm_E = 0;
    if (N <= 0)
      return;

    bool phaseone = true;
    const T gamma = max_diag(m, 0, N);
    int j = 0;

    // ---- Phase one: plain Cholesky with diagonal pivoting, for as long
    // ---- as the remaining submatrix looks safely positive definite.
    while (j < N)
      {
        T minval, maxval;
        int i_min, i_max;

        print_matrix(m, N);

        minmax_diag(m, j, N, minval, maxval, i_min, i_max);
        if (maxval < tau_bar*gamma || minval < -mu*maxval)
          {
            phaseone = false;
            break;
          }

        if (i_max != j)
          {
            if (verbose_eskow)
              std::cout << "Have to swap i=" << i_max << " and j=" << j << std::endl;
            swap_symmetric(m, N, j, i_max);
          }

        // Look-ahead on the next diagonal; there is nothing to look at
        // once the last column has been reached.
        if (j+1 < N && min_row(m, j, N) < -mu*gamma)
          {
            phaseone = false;
            break;
          }

        eliminate_column(m, j, N);
        j++;
      }

    if (phaseone)
      return;

    // ---- Phase one stopped on the very last diagonal element.
    if (j == N-1)
      {
        const T A_nn = m(N-1,N-1);
        const T delta = -A_nn + std::max(tau*(-A_nn)/(1-tau), tau_bar*gamma);

        m(N-1,N-1) = std::sqrt(A_nn + delta);
        norm_E = delta;
        return;
      }

    // ---- Phase two: at least a 2x2 block remains (j < N-1).
    if (verbose_eskow)
      std::cout << "Phase two ! (j=" << j << ")" << std::endl;

    const int first = j;  // first column not factorized by phase one
    std::vector<T> g(N);

    // Lower Gerschgorin bounds of the remaining submatrix.
    for (int i = first; i < N; i++)
      {
        g[i] = m(i,i);
        for (int c = first; c < i; c++)
          g[i] -= std::abs(m(i,c));
        for (int r = i+1; r < N; r++)
          g[i] -= std::abs(m(r,i));
      }

    T delta_prev = 0;

    for (int col = first; col < N-2; col++)
      {
        print_matrix(m, N);

        // Pivot on the largest Gerschgorin bound estimate; the bounds have
        // to follow the permutation.
        const int piv = g_max(g, col, N);
        if (piv != col)
          {
            swap_symmetric(m, N, col, piv);
            std::swap(g[col], g[piv]);
          }

        // 1-norm of the sub-diagonal part of the column.
        T norm_j = 0;
        for (int i = col+1; i < N; i++)
          norm_j += std::abs(m(i,col));

        // Amount to add to the diagonal; never smaller than the previous one.
        const T delta = std::max(delta_prev,
                                 std::max(T(0), -m(col,col) + std::max(norm_j, tau_bar*gamma)));
        if (delta > 0)
          {
            m(col,col) += delta;
            delta_prev = delta;
          }

        // Update the Gerschgorin bound estimates.
        if (m(col,col) != norm_j)
          {
            const T temp = 1 - norm_j/m(col,col);

            for (int i = col+1; i < N; i++)
              g[i] += std::abs(m(i,col))*temp;
          }

        eliminate_column(m, col, N);
      }

    // ---- The final 2x2 submatrix is handled through its eigenvalues.
    T A00 = m(N-2,N-2), A10 = m(N-1,N-2), A11 = m(N-1,N-1);
    // gap = lambda_hi - lambda_lo of [[A00, A10], [A10, A11]].
    const T gap = std::sqrt(square(A00-A11) + 4*square(A10));
    const T lambda_lo = T(0.5)*((A00+A11) - gap);

    const T delta = std::max(std::max(T(0), -lambda_lo + std::max(tau*gap/(1-tau), tau_bar*gamma)),
                             delta_prev);
    if (delta > 0)
      {
        A00 += delta;
        A11 += delta;
        delta_prev = delta;
      }

    A00 = std::sqrt(A00);
    A10 /= A00;
    m(N-2,N-2) = A00;
    m(N-1,N-2) = A10;
    m(N-1,N-1) = std::sqrt(A11 - A10*A10);

    // delta never decreases, so the last value is the largest one applied.
    norm_E = delta_prev;
  }

};


#endif
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`#ifndef __ESKOW_CHOLESKY_HPP`
			`#define __ESKOW_CHOLESKY_HPP`

			`#include <cmath>`
			`#include <vector>`
			`#include "mach.hpp"`

			`/* Implementation of Schnabel & Eskow, 1999, Vol. 9, No. 4, pp. 1135-148, SIAM J. OPTIM. */`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`template<typename T, typename A>`
			`class CholeskyEskow`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`private:`
			`static const bool verbose_eskow = true;`
			`T tau, tau_bar, mu;`

			`void print_matrix(A& m, int N)`
			`{`
			`using std::cout;`
			`using std::endl;`
			`using std::setprecision;`

			`if (verbose_eskow)`
			`{`

			`for (int i = 0; i < N; i++)`
			`{`
			`for (int j = 0; j < N; j++)`
			`{`
			`cout.width(6);`
			`cout << setprecision(5) << m(i,j) << " ";`
			`}`
			`cout << endl;`
			`}`
			`cout << endl;`
			`}`
			`}`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`T max_diag(A& m, int j, int N)`
			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`T maxval = std::abs(m(j,j));`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00
			`for (int k = j+1; k < N; k++)`
			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`maxval = std::max(maxval, std::abs(m(k,k)));`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`}`
			`return maxval;`
			`}`

			`void minmax_diag(A& m, int j, int N, T& minval, T& maxval, int& i_min, int& i_max)`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`i_min = i_max = j;`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`minval = maxval = m(j,j);`

			`for (int k = j+1; k < N; k++)`
			`{`
			`maxval = std::max(maxval, m(k,k));`
			`minval = std::min(minval, m(k,k));`
			`}`

			`for (int k = j; k < N; k++)`
			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`if (m(k,k) == minval && i_min < 0)`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`i_min = k;`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`if (m(k,k) == maxval && i_max < 0)`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`i_max = k;`
			`}`
			`}`

			`void swap_rows(A& m, int N, int i0, int i1)`
			`{`
			`for (int r = 0; r < N; r++)`
			`std::swap(m(r,i0), m(r,i1));`
			`}`

			`void swap_cols(A& m, int N, int i0, int i1)`
			`{`
			`for (int c = 0; c < N; c++)`
			`std::swap(m(i0,c), m(i1,c));`
			`}`

			`T square(T x)`
			`{`
			`return x*x;`
			`}`

Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`T min_row(A& m, int j, int N)`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`{`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`T a = 1/m(j,j);`
			`T v = m(j+1,j+1) - square(m(j+1,j))*a;`

			`for (int i = j+2; i < N; i++)`
			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`v = std::min(v, m(i, i) - square(m(i,j))*a);`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`}`

			`return v;`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`}`

Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`int g_max(const std::vector<T>& g, int j, int N)`
			`{`
			`T a = g[j];`
			`int k = j;`

			`for (int i = j+1; i < N; i++)`
			`{`
			`if (a < g[i])`
			`{`
			`a = g[i];`
			`k = i;`
			`}`
			`}`
			`return k;`
			`}`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`public:`
			`CholeskyEskow()`
			`{`
			`tau = std::pow(mach_epsilon<T>(), 1./3);`
			`tau_bar = std::pow(mach_epsilon<T>(), 2./3);`
			`mu=0.1;`
			`}`

			`void cholesky(A& m, int N, T& norm_E)`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`{`
			`bool phaseone = true;`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`T gamma = max_diag(m, 0, N);`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`int j;`

Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`norm_E = 0;`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`for (j = 0; j < N && phaseone; j++)`
			`{`
			`T minval, maxval;`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`int i_min, i_max;`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00
			`print_matrix(m, N);`

			`minmax_diag(m, j, N, minval, maxval, i_min, i_max);`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`if (maxval < tau_bar*gamma || minval < -mu*maxval)`
			`{`
			`phaseone = false;`
			`break;`
			`}`

Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`if (i_max != j)`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`std::cout << "Have to swap i=" << i_max << " and j=" << j << std::endl;`
			`swap_cols(m, N, i_max, j);`
			`swap_rows(m, N, i_max, j);`

Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`}`

Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`if (min_row(m, j, N) < -mu*gamma)`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`{`
			`phaseone = false;`
			`break;`
			`}`

			`T L_jj = std::sqrt(m(j,j));`

			`m(j,j) = L_jj;`
			`for (int i = j+1; i < N; i++)`
			`{`
			`m(i,j) /= L_jj;`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`for (int k = j+1; k <= i; k++)`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`m(i,k) -= m(i,j)*m(k,j);`
			`}`
			`}`

Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`if (!phaseone && j == N-1)`
			`{`
			`T A_nn = m(N-1,N-1);`
			`T delta = -A_nn + std::max(tau*(-A_nn)/(1-tau), tau_bar*gamma);`

			`m(N-1,N-1) = std::sqrt(m(N-1,N-1) + delta);`
			`}`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00


Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`if (!phaseone && j < (N-1))`
			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`std::cout << "Phase two ! (j=" << j << ")" << std::endl;`

Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`int k = j-1;`
			`std::vector<T> g(N);`

			`for (int i = k+1; i < N; i++)`
			`{`
			`g[i] = m(i,i);`
			`for (int j = k+1; j < i; j++)`
			`g[i] -= std::abs(m(i,j));`
			`for (int j = i+1; j < N; j++)`
			`g[i] -= std::abs(m(j,i));`
			`}`

			`T delta, delta_prev = 0;`

			`for (int j = k+1; j < N-2; j++)`
			`{`
			`int i = g_max(g, j, N);`
			`T norm_j;`

Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`print_matrix(m, N);`

Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`if (i != j)`
			`{`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`swap_cols(m, N, i, j);`
			`swap_rows(m, N, i, j);`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`}`

Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`for (int i = j+1; j < N; j++)`
			`{`
			`norm_j += std::abs(m(i,j));`
			`}`

			`delta = std::max(delta_prev, std::max((T)0, -m(j,j) + std::max(norm_j,tau_bar*gamma)));`
			`if (delta > 0)`
			`{`
			`m(j,j) += delta;`
			`delta_prev = delta;`
			`}`

			`if (m(j,j) != norm_j)`
			`{`
			`T temp = 1 - norm_j/m(j,j);`

			`for (int i = j+1; j < N; j++)`
			`{`
			`g[i] += std::abs(m(i,j))*temp;`
			`}`
			`}`

			`// Now we do the classic cholesky iteration`
			`T L_jj = std::sqrt(m(j,j));`

			`m(j,j) = L_jj;`
			`for (int i = j+1; i < N; i++)`
			`{`
			`m(i,j) /= L_jj;`
Fixed decomposition. Add sample matrix. 2011-12-14 17:40:10 -05:00			`for (int k = j+1; k <= i; k++)`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00			`m(i,k) -= m(i,j)*m(k,j);`
			`}`
			`}`

			`// The final 2x2 submatrix is special`
			`T A00 = m(N-2, N-2), A01 = m(N-2, N-1), A11 = m(N-1,N-1);`
			`T sq_DELTA = std::sqrt(square(A00-A11) + square(A01));`
			`T lambda_hi = 0.5*((A00+A11) + sq_DELTA);`
			`T lambda_lo = 0.5*((A00+A11) - sq_DELTA);`

			`delta = std::max(std::max((T)0, -lambda_lo + std::max(tau*sq_DELTA/(1-tau), tau_bar*gamma)),delta_prev);`
			`if (delta > 0)`
			`{`
			`m(N-1,N-1) += delta;`
			`m(N,N) += delta;`
			`delta_prev = delta;`
			`}`
			`m(N-2,N-2) = A00 = std::sqrt(A00);`
			`m(N-1,N-2) = (A01 /= A00);`
			`m(N-1,N-1) = std::sqrt(A11-A01*A01);`
			`norm_E = delta_prev;`
Incomplete implementatiof Eskow algorithm 2011-12-13 17:03:14 -05:00			`}`
			`}`

			`};`
Got a compiling version of the algorithm 2011-12-13 17:48:37 -05:00

			`#endif`