Program Listing for File matrix_continued_fraction.hpp¶

↰ Return to documentation for file (src_ed/matrix_continued_fraction.hpp)
#ifndef matrix_continued_fraction_h
#define matrix_continued_fraction_h

/*
 matrix_continued_fraction.hpp

 Matrix-valued continued fraction arising from the block Lanczos method.

 Scalar analogue: continued_fraction (see continued_fraction.hpp).

 A block Lanczos run with block size p and M steps produces:
   A[0..M-1]  -- p×p Hermitian diagonal blocks
   B[0..M-1]  -- p×p upper-triangular off-diagonal QR blocks

 These define a block-tridiagonal projected Hamiltonian T whose (0,0)
 block resolvent F_0(z) = [(zI - T)^{-1}]_{00} is evaluated via the
 backward recursion (matrix continued fraction):

   F_M = 0_{p×p}
   F_j = (zI - A_j - B_j^H F_{j+1} B_j)^{-1},   j = M-1 … 0

 where B_j (j < M-1) are the off-diagonal blocks stored in B; B[M-1] is
 the truncation residual and is not used in the recursion, in exact
 analogy with the last element of the b array in continued_fraction.

 If the starting block phi was not pre-orthonormalised before calling
 blockLanczos, an optional weight matrix W can be supplied so that the
 full projected Green function is  G(z) = W^H F_0(z) W.

 Usage:
   vector<matrix<HilbertField>> A, B;
   int M0 = 50;
   blockLanczos(H, phi, A, B, M0);
   matrix_continued_fraction<HilbertField> mcf(A, B);   // orthonormal starting block
   matrix<Complex> G = mcf.evaluate(z);
*/

#include "continued_fraction.hpp"   // pulls in block_matrix.hpp → matrix.hpp
// hdf5_io.hpp is already pulled in by continued_fraction.hpp
#include "Q_matrix.hpp"


template<typename T>
void mcf_polar_decompose(const matrix<T> &C, matrix<T> &W, matrix<T> &P)
{
    int p = (int)C.r;
    matrix<T> Ch(C);
    Ch.hermitian_conjugate();
    matrix<T> M(p);
    M.product(Ch, C);                   // M = C^H * C  (Hermitian PSD)

    vector<double> D(p);
    matrix<T> V(p);
    M.eigensystem(D, V);                // M = V * diag(D) * V^H, D >= 0

    double tol = global_double("accur_deflation");
    tol *= tol;

    P.set_size(p);
    matrix<T> Pinv(p);
    for(int r = 0; r < p; ++r){
        for(int c = 0; c < p; ++c){
            T s(0), si(0);
            for(int m = 0; m < p; ++m){
                double sq = sqrt(max(D[m], 0.0));
                T vc = V(r,m) * conjugate(V(c,m));
                s  += vc * T(sq);
                si += vc * T(D[m] > tol ? 1.0/sq : 0.0);
            }
            P(r,c) = s;
            Pinv(r,c) = si;
        }
    }
    W.set_size(p);
    W.product(C, Pinv);                 // W = C * P^{-1}
}

template<typename T>
void mcf_qr_decompose(const matrix<T> &C, matrix<T> &Q, matrix<T> &R)
{
    int p = (int)C.r;
    Q = C;
    R.set_size(p);
    for(int l = 0; l < p; ++l){
        for(int k = 0; k < l; ++k){
            T z(0);
            for(int i = 0; i < p; ++i) z += conjugate(Q(i,k)) * Q(i,l);
            R(k,l) = z;
            for(int i = 0; i < p; ++i) Q(i,l) -= z * Q(i,k);
        }
        double nrm2 = 0.0;
        for(int i = 0; i < p; ++i) nrm2 += realpart(conjugate(Q(i,l)) * Q(i,l));
        double nrm = sqrt(nrm2);
        R(l,l) = T(nrm);
        for(int i = 0; i < p; ++i) Q(i,l) *= T(1.0/nrm);
    }
}



template<typename T>
struct matrix_continued_fraction
{
    int p;
    vector<matrix<T>> A;
    vector<matrix<T>> B;
    matrix<Complex>   W;
    bool hermitian_B = false;

    matrix_continued_fraction() : p(0) {}


    matrix_continued_fraction(const vector<matrix<T>> &_A,
                               const vector<matrix<T>> &_B)
    {
        p = (int)_A[0].r;
        A = _A;
        B = _B;
        W.set_size(p);
        W.identity();
    }


    matrix_continued_fraction(const vector<matrix<T>> &_A,
                               const vector<matrix<T>> &_B,
                               double e0,
                               const matrix<T> &_W,
                               bool create)
    {
        p = (int)_A[0].r;
        A = _A;
        B = _B;
        for(size_t j = 0; j < A.size(); ++j){
            if(create) A[j] -= e0;            // A[j] -= e0 * I
            else {
                for(size_t r = 0; r < A[j].v.size(); ++r) A[j].v[r] = -A[j].v[r];
                A[j] += e0;                   // A[j] = e0*I - A[j]
            }
        }
        W = to_complex_matrix(_W);
    }


    matrix_continued_fraction(const vector<matrix<T>> &_A,
                               const vector<matrix<T>> &_B,
                               const matrix<Complex> &_W)
    {
        if(_A.empty()){ p = 0; return; }
        p = (int)_A[0].r;
        A = _A;
        B = _B;
        W = _W;
    }


    matrix<Complex> evaluate(Complex z) const
    {
        int M = (int)A.size();

        // F starts as the M-th floor: F_M = 0
        matrix<Complex> F(p, p);   // zero-initialised

        for(int j = M - 1; j >= 0; --j){

            // Σ = B[j]^H · F · B[j]  (only when j < M-1; otherwise Σ = 0)
            matrix<Complex> sigma(p, p);  // zero-initialised
            if(j < M - 1){
                matrix<Complex> Bj = to_complex_matrix(B[j]);
                // step 1: tmp = F · B[j]
                matrix<Complex> tmp(p);
                tmp.product(F, Bj);
                // step 2: sigma = B[j]^H · tmp
                matrix<Complex> Bjh(Bj);
                Bjh.hermitian_conjugate();
                sigma.product(Bjh, tmp);
            }

            // Build denominator D = z·I - A[j] - Σ
            matrix<Complex> D(p, p);    // zero
            D += z;                     // D = z·I
            D -= to_complex_matrix(A[j]);  // D = z·I - A[j]
            D -= sigma;                 // D = z·I - A[j] - Σ

            D.inverse();                // D  →  D^{-1}
            F = D;                      // F_{j} = D^{-1}
        }

        // Apply weight: G = W^H · F_0 · W
        // W may be non-square (p rows × q columns): result is q×q.
        int q = (int)W.c;
        matrix<Complex> tmp(p, q);
        tmp.product(F, W);              // tmp = F · W  (p × q)
        matrix<Complex> Wh(W);
        Wh.hermitian_conjugate();       // Wh  = W^H   (q × p)
        matrix<Complex> G(q, q);
        G.product(Wh, tmp);             // G   = W^H · F · W  (q × q)

        return G;
    }


    vector<T> apply(const vector<T>& x) const {
        int M = (int)A.size();
        vector<T> y(M * p, T(0));
        for(int j = 0; j < M; ++j){
            // diagonal: A[j] * x_j
            for(int col = 0; col < p; ++col)
                for(int row = 0; row < p; ++row)
                    y[j*p + row] += A[j](row, col) * x[j*p + col];
            // sub-diagonal: B[j-1] * x_{j-1}
            if(j > 0)
                for(int col = 0; col < p; ++col)
                    for(int row = 0; row < p; ++row)
                        y[j*p + row] += B[j-1](row, col) * x[(j-1)*p + col];
            // super-diagonal: B[j]^H * x_{j+1}  (B[M-1] not used)
            if(j < M-1)
                for(int col = 0; col < p; ++col)
                    for(int row = 0; row < p; ++row)
                        y[j*p + row] += conjugate(B[j](col, row)) * x[(j+1)*p + col];
        }
        return y;
    }


    matrix_continued_fraction<double> real() const {
        matrix_continued_fraction<double> result;
        result.p = p;
        result.A.resize(A.size());
        result.B.resize(B.size());
        for(size_t j = 0; j < A.size(); ++j) result.A[j] = to_real_matrix(A[j]);
        for(size_t j = 0; j < B.size(); ++j) result.B[j] = to_real_matrix(B[j]);
        result.W = to_complex_matrix(to_real_matrix(W));
        result.hermitian_B = hermitian_B;
        return result;
    }

    int floors() const { return (int)A.size(); }


    void convert_B_format()
    {
        int M = (int)A.size();
        if(M == 0){ hermitian_B = !hermitian_B; return; }

        matrix<T> G(p);
        G.identity();
        for(int j = 0; j < M; ++j){
            matrix<T> Gh(G);
            Gh.hermitian_conjugate();
            matrix<T> tmp(p);
            tmp.product(A[j], G);
            A[j].product(Gh, tmp);          // A[j] <- G^H * A[j] * G

            matrix<T> C(p);
            C.product(B[j], G);             // C = B[j] * G

            if(hermitian_B){
                matrix<T> Q, R;
                mcf_qr_decompose(C, Q, R);  // C = Q*R, R upper-triangular
                B[j] = R;
                G = Q;
            } else {
                matrix<T> Wp, P;
                mcf_polar_decompose(C, Wp, P);  // C = Wp*P, P Hermitian PSD
                B[j] = P;
                G = Wp;
            }
        }
        hermitian_B = !hermitian_B;
    }
};


// C++14-compatible helpers: convert a Complex scalar to field T.
inline double      mcf_to_T(Complex z, double)  { return z.real(); }
inline Complex     mcf_to_T(Complex z, Complex) { return z; }



template<typename T>
struct diagonal_hamiltonian {
    const vector<double>& evals;
    explicit diagonal_hamiltonian(const vector<double>& _e) : evals(_e) {}
    void mult_add(const vector<T>& x, vector<T>& y) const {
        for(size_t i = 0; i < evals.size(); ++i)
            y[i] += T(evals[i]) * x[i];
    }
};



template<typename HilbertField>
matrix_continued_fraction<HilbertField> Q_matrix_to_mcf(const Q_matrix<HilbertField>& Q)
{
    const int L = (int)Q.L;
    const int M = (int)Q.M;
    if(M == 0 || L == 0) return matrix_continued_fraction<HilbertField>();

    // Build starting block: phi[a] = row a of Q.v  (length-M vectors)
    vector<vector<HilbertField>> phi(L, vector<HilbertField>(M));
    for(int a = 0; a < L; ++a)
        for(int k = 0; k < M; ++k)
            phi[a][k] = Q.v(a, k);

    // Extract the upper-triangular QR factor W from phi via modified Gram-Schmidt.
    // The working copy q is discarded; blockLanczos re-orthonormalises phi internally.
    matrix<HilbertField> W(L);
    {
        vector<vector<HilbertField>> q(phi);
        for(int l = 0; l < L; ++l){
            for(int k = 0; k < l; ++k){
                HilbertField z = q[k] * q[l];
                W(k, l) = z;
                mult_add(-z, q[k], q[l]);
            }
            double nrm = norm(q[l]);
            W(l, l) = HilbertField(nrm);
            q[l] *= 1.0 / nrm;
        }
    }

    diagonal_hamiltonian<HilbertField> H(Q.e);
    vector<matrix<HilbertField>> A, B;
    int M0 = M;
    bool use_QR = global_bool("block_Lanczos_QR");
    if(use_QR)
        blockLanczos(H, phi, A, B, M0);
    else
        blockLanczosSVD(H, phi, A, B, M0);

    matrix_continued_fraction<HilbertField> mcf(A, B, to_complex_matrix(W));
    mcf.hermitian_B = !use_QR;
    return mcf;
}



template<typename T>
matrix_continued_fraction<T> combine_for_gf(
    const matrix_continued_fraction<T>& e,
    const matrix_continued_fraction<T>& h)
{
    const int pe = e.p, ph = h.p;
    QCM_ASSERT(pe == ph);
    QCM_ASSERT(e.hermitian_B == h.hermitian_B);
    const int p = pe + ph;
    const int Me = e.floors(), Mh = h.floors(), M = max(Me, Mh);

    // Direct-sum A and B blocks (identical to direct_sum())
    vector<matrix<T>> A(M), B(M);
    for(int j = 0; j < M; ++j){
        A[j] = matrix<T>(p, p);
        B[j] = matrix<T>(p, p);
        if(j < Me){
            e.A[j].move_sub_matrix(pe, pe, 0, 0, 0,  0,  A[j]);
            e.B[j].move_sub_matrix(pe, pe, 0, 0, 0,  0,  B[j]);
        }
        if(j < Mh){
            h.A[j].move_sub_matrix(ph, ph, 0, 0, pe, pe, A[j]);
            h.B[j].move_sub_matrix(ph, ph, 0, 0, pe, pe, B[j]);
        }
    }

    // Non-square weight W (2p × p): upper block = conj(W_e), lower block = W_h.
    matrix<Complex> W(p, pe);   // zero-initialised
    for(int k = 0; k < pe; ++k)
        for(int i = 0; i < pe; ++i)
            W(k, i) = conj(e.W(k, i));   // conj(W_e) in electron rows
    for(int k = 0; k < ph; ++k)
        for(int i = 0; i < ph; ++i)
            W(pe + k, i) = h.W(k, i);    // W_h in hole rows

    matrix_continued_fraction<T> mcf(A, B, W);
    mcf.hermitian_B = e.hermitian_B;
    return mcf;
}



template<typename T>
struct combined_sector_operator {
    const matrix_continued_fraction<T>& e;
    const matrix_continued_fraction<T>& h;
    const int Me, Mh, p;

    combined_sector_operator(const matrix_continued_fraction<T>& _e,
                              const matrix_continued_fraction<T>& _h)
        : e(_e), h(_h), Me(_e.floors()), Mh(_h.floors()), p(_e.p)
    { QCM_ASSERT(_e.p == _h.p); }

    void mult_add(const vector<T>& x, vector<T>& y) const {
        // e-sector: y_e += T_e * x_e
        vector<T> xe(x.begin(), x.begin() + Me * p);
        vector<T> ye = e.apply(xe);
        for(int i = 0; i < Me * p; ++i) y[i] += ye[i];

        // h-sector: y_h += T_h* x_h = conj(T_h conj(x_h))
        vector<T> xh(x.begin() + Me * p, x.end());
        for(auto& v : xh) v = conjugate(v);          // conjugate x_h
        vector<T> yh = h.apply(xh);                  // T_h * conj(x_h)
        for(int i = 0; i < Mh * p; ++i) y[Me * p + i] += conjugate(yh[i]);
    }
};



template<typename T>
matrix_continued_fraction<T> combine_via_lanczos(
    const matrix_continued_fraction<T>& e,
    const matrix_continued_fraction<T>& h,
    int M0)
{
    const int p  = e.p;
    QCM_ASSERT(e.p == h.p);
    const int Me = e.floors(), Mh = h.floors();
    const int N  = (Me + Mh) * p;  // total dimension of the combined space

    // Build starting block: p vectors of length N.
    // phi[i]: W_e[:,i]       at e-sector level 0 (positions 0..p-1)
    // phi[i]: conj(W_h[:,i]) at h-sector level 0 (positions Me*p .. Me*p+p-1)
    // The conjugate on the h-sector, combined with the T_h* operator, ensures
    // the h contribution to evaluate() gives (G⁻)ᵀ instead of G⁻.
    vector<vector<T>> phi(p, vector<T>(N, T(0)));
    for(int i = 0; i < p; ++i){
        for(int k = 0; k < p; ++k){
            phi[i][k]          = mcf_to_T(e.W(k, i),       T(0));  // W_e
            phi[i][Me * p + k] = mcf_to_T(conj(h.W(k, i)), T(0));  // conj(W_h)
        }
    }

    // Extract the upper-triangular QR factor W_new from phi via modified
    // Gram-Schmidt (mirrors the procedure in model_instance::build_mcf).
    matrix<T> W_new(p);
    {
        vector<vector<T>> q(phi);   // working copies
        for(int l = 0; l < p; ++l){
            for(int k = 0; k < l; ++k){
                T z = q[k] * q[l];   // inner product <q[k]|q[l]>
                W_new(k, l) = z;
                mult_add(-z, q[k], q[l]);
            }
            double nrm = norm(q[l]);
            W_new(l, l) = T(nrm);
            q[l] *= 1.0 / nrm;
        }
    }

    // Run block Lanczos on T_e ⊕ T_h with the p starting vectors.
    // block_Lanczos_QR=true (default) uses QR; false uses polar decomposition (Hermitian B).
    combined_sector_operator<T> op(e, h);
    vector<matrix<T>> A_new, B_new;
    bool use_QR = global_bool("block_Lanczos_QR");
    if(use_QR)
        blockLanczos(op, phi, A_new, B_new, M0);
    else
        blockLanczosSVD(op, phi, A_new, B_new, M0);

    matrix_continued_fraction<T> mcf(A_new, B_new, to_complex_matrix(W_new));
    mcf.hermitian_B = !use_QR;
    return mcf;
}


template<typename T>
std::ostream& operator<<(std::ostream& os, const matrix_continued_fraction<T>& F)
{
    int M = F.floors();
    os << "matrix_continued_fraction: p=" << F.p << "  floors=" << M
       << "  B=" << (F.hermitian_B ? "Hermitian" : "upper-triangular") << '\n';
    for(int j = 0; j < M; ++j){
        os << "A[" << j << "]:\n" << F.A[j];
    }
    for(int j = 0; j < (int)F.B.size(); ++j){
        os << "B[" << j << "]:\n" << F.B[j];
    }
    os << "W:\n" << F.W;
    return os;
}


template<typename T>
void h5_write_mcf(H5::Group& grp, const matrix_continued_fraction<T>& F)
{
    int M = F.floors();
    h5_write_attr(grp, "p",           F.p);
    h5_write_attr(grp, "floors",      M);
    h5_write_attr(grp, "hermitian_B", F.hermitian_B ? 1 : 0);
    for(int j = 0; j < M; ++j){
        H5::Group ag = grp.createGroup("A_" + to_string(j));
        h5_write_mat(ag, "data", F.A[j]);
    }
    for(int j = 0; j < (int)F.B.size(); ++j){
        H5::Group bg = grp.createGroup("B_" + to_string(j));
        h5_write_mat(bg, "data", F.B[j]);
    }
    H5::Group wg = grp.createGroup("W");
    h5_write_mat(wg, "data", F.W);
}


template<typename T>
void h5_read_mcf(H5::Group& grp, matrix_continued_fraction<T>& F)
{
    F.p   = h5_read_attr_int(grp, "p");
    int M = h5_read_attr_int(grp, "floors");
    // hermitian_B is absent in files written before this flag existed;
    // default to false (upper-triangular) for backward compatibility.
    F.hermitian_B = grp.attrExists("hermitian_B") && h5_read_attr_int(grp, "hermitian_B") != 0;
    F.A.resize(M);
    F.B.resize(M);
    for(int j = 0; j < M; ++j){
        H5::Group ag = grp.openGroup("A_" + to_string(j));
        h5_read_mat(ag, "data", F.A[j]);
    }
    for(int j = 0; j < M; ++j){
        H5::Group bg = grp.openGroup("B_" + to_string(j));
        h5_read_mat(bg, "data", F.B[j]);
    }
    H5::Group wg = grp.openGroup("W");
    h5_read_mat(wg, "data", F.W);
}


#endif