// Copyright (C) 2026 Kiyotsugu Arai // SPDX-License-Identifier: LGPL-3.0-or-later /** * @file iterative_solvers.hpp * @brief 反復法ソルバー API 拡充 * * 追加ソルバー: * - MINRES (対称不定行列用) * - FGMRES (可変前処理対応の Flexible GMRES) * * 統一 API: * - IterativeSolver : ビルダーパターンによるソルバー構成 * - SolverLog : 収束履歴の記録 * - solve() : 行列性質に基づく自動ソルバー選択 */ #ifndef CALX_ITERATIVE_SOLVERS_HPP #define CALX_ITERATIVE_SOLVERS_HPP #include

#include #include #include #include #include #include #include #include #include #include #include namespace calx {

namespace sparse_algorithms {

// ============================================================================
// SolverLog — convergence history recording
// ============================================================================

/**
 * @brief Convergence history collected while an iterative solver runs.
 *
 * A solver appends one residual norm per call to record(); the history can
 * then be inspected directly or summarised with convergence_rate().
 *
 * @tparam T scalar type of the residual norms
 */
template <typename T>
struct SolverLog {
    std::vector<T> residual_history;   ///< residual norm recorded at each iteration
    // NOTE(review): element type assumed to be double (wall-clock seconds);
    // nothing in this struct reads or writes it yet — confirm against callers.
    std::vector<double> time_history;  ///< (reserved for future use) cumulative time per iteration

    /// Discards every recorded entry.
    void clear() {
        residual_history.clear();
        time_history.clear();
    }

    /// Appends one residual norm to the history.
    void record(T rnorm) {
        residual_history.push_back(rnorm);
    }

    /**
     * @brief Average per-iteration residual reduction factor.
     *
     * Computes the geometric mean of the reduction over the last @p window
     * iterations, i.e. |r_last / r_(last - w)|^(1/w) with
     * w = min(window, number of recorded entries - 1).
     *
     * @param window number of trailing iterations to average over
     * @return the reduction factor, or the neutral value T(1) when it is
     *         undefined: fewer than two entries, a zero-length window, or a
     *         reference residual that is exactly zero (which would otherwise
     *         divide by zero).
     */
    [[nodiscard]] T convergence_rate(std::size_t window = 5) const {
        const std::size_t n = residual_history.size();
        if (n < 2) return T(1);

        const std::size_t w = std::min(window, n - 1);
        if (w == 0) return T(1);  // avoids the 1/0 exponent

        const T& reference = residual_history[n - 1 - w];
        if (reference == T(0)) return T(1);  // ratio undefined: avoid dividing by zero

        const T ratio = residual_history[n - 1] / reference;
        return std::pow(std::abs(ratio), T(1) / static_cast<T>(w));
    }
};

// ============================================================================
// MINRES — for symmetric indefinite matrices
// ============================================================================

/**
 * @brief MINRES (Minimum Residual Method)
 *
 * Solves Ax = b for a symmetric (possibly indefinite) sparse matrix A.
 * Whereas CG requires positive definiteness, MINRES can also be used on
 * indefinite matrices. Symmetry of A is not verified by this function.
 *
 * Implementation: Lanczos tridiagonalization + GMRES-style Givens QR.
 * Lanczos tridiagonalizes the symmetric matrix, and the same Givens rotation
 * procedure as in GMRES reduces the Hessenberg matrix to upper-triangular
 * form. By symmetry the Hessenberg matrix is tridiagonal, so each column
 * needs only a constant number of rotations (versus j of them in GMRES).
 *
 * @param A        system matrix; must be square
 * @param b        right-hand side; its size must equal the number of rows of A
 * @param criteria supplies absolute_tolerance(), relative_tolerance() and
 *                 max_iterations(); the stopping threshold is
 *                 absolute_tolerance + relative_tolerance * ||b||, and the
 *                 number of iterations is capped at min(max_iterations, n)
 * @param precond  accepted but not used by this implementation (it is
 *                 explicitly discarded below)
 * @param x0       optional initial guess; the zero vector is used when absent
 * @param log      optional; when non-null it receives the initial residual
 *                 norm and then the residual estimate of every iteration that
 *                 completes normally
 * @return a result brace-initialized from, in order: the solution vector, the
 *         residual norm recomputed as norm(b - A * x), the number of Krylov
 *         steps used (0 when the initial guess already meets the threshold),
 *         and whether that residual norm is within the threshold
 * @throws std::invalid_argument if A is not square or b has the wrong size
 */
template requires concepts::OrderedField && std::integral SolverResult minres(
    const SparseMatrix & A,
    const Vector & b,
    const ConvergenceCriteria & criteria,
    Preconditioner precond = {},
    std::optional > x0 = std::nullopt,
    SolverLog * log = nullptr)
{
    const auto n = static_cast (A.rows());
    if (static_cast (A.cols()) != n)
        throw std::invalid_argument("MINRES: matrix must be square");
    if (b.size() != n)
        throw std::invalid_argument("MINRES: incompatible dimensions");

    // The preconditioner is deliberately ignored; the cast only silences the
    // unused-parameter warning.
    (void)precond;

    Vector x = x0.value_or(Vector (n, T{0}));

    const T b_norm = norm(b);
    const T threshold = criteria.absolute_tolerance() +
                        criteria.relative_tolerance() * b_norm;

    // Lanczos + Givens QR (the GMRES scheme specialized to a tridiagonal matrix).
    // The iteration count never exceeds the problem dimension n.
    const std::size_t max_iter = std::min(criteria.max_iterations(), n);

    Vector r = b - A * x;
    T r_norm = norm(r);
    if (log) log->record(r_norm);
    // The initial guess already satisfies the stopping criterion.
    if (r_norm <= threshold) {
        return {x, r_norm, 0, true};
    }

    // Lanczos basis: every basis vector is kept because the solution is
    // assembled from all of them after the loop.
    std::vector > Q(max_iter + 1);
    Q[0] = r / r_norm;

    // The tridiagonal matrix is held in Hessenberg form, indexed H[row][column]
    // (two entries per column: H[j][j], H[j+1][j]).
    // The values from before the Givens rotations are needed as well, so the
    // previous columns are required too
    // -> use the same structure as GMRES (H is (m+1) x m, but being tridiagonal
    //    it has bandwidth 2).
    // NOTE(review): H is allocated as a full (max_iter + 1) x max_iter table
    // even though only a narrow band is ever written; with max_iter up to n
    // this is quadratic in memory.
    std::vector > H(max_iter + 1, std::vector (max_iter, T{0}));

    // cs/sn: cosine and sine of the Givens rotation chosen for each column.
    // g: right-hand side of the least-squares problem, rotated along with H.
    std::vector cs(max_iter, T{0}), sn(max_iter, T{0});
    std::vector g(max_iter + 1, T{0});
    g[0] = r_norm;

    // NOTE(review): v_prev is not referenced anywhere else in this function.
    Vector v_prev(n, T{0});
    std::size_t j = 0;
    for (; j < max_iter; ++j) {
        // Lanczos step (= Arnoldi step for a symmetric matrix)
        Vector w = A * Q[j];

        // Modified Gram-Schmidt (by symmetry only the j-1 and j coefficients are non-zero)
        if (j > 0) {
            H[j - 1][j] = dot(Q[j - 1], w);  // = beta_j (super-diagonal of the tridiagonal matrix)
            w -= Q[j - 1] * H[j - 1][j];
        }
        H[j][j] = dot(Q[j], w);  // = alpha_j
        w -= Q[j] * H[j][j];

        H[j + 1][j] = norm(w);  // = beta_{j+1}

        // Happy breakdown: the new direction has (numerically) zero norm, so no
        // further basis vector can be built.
        // NOTE(review): the test is an absolute bound (100 * epsilon), not one
        // scaled by the magnitude of the matrix entries.
        if (std::abs(H[j + 1][j]) < std::numeric_limits ::epsilon() * T{100}) {
            // Apply the Givens rotations, then stop. All previous rotations are
            // applied here, not only the last two as in the regular path.
            for (std::size_t i = 0; i < j; ++i) {
                T tmp = cs[i] * H[i][j] + sn[i] * H[i + 1][j];
                H[i + 1][j] = -sn[i] * H[i][j] + cs[i] * H[i + 1][j];
                H[i][j] = tmp;
            }
            T rr = std::sqrt(H[j][j] * H[j][j] + H[j + 1][j] * H[j + 1][j]);
            // Guard against dividing by zero when the whole column vanished.
            if (rr > T{0}) {
                cs[j] = H[j][j] / rr;
                sn[j] = H[j + 1][j] / rr;
                H[j][j] = rr;
                H[j + 1][j] = T{0};
                T g_new = -sn[j] * g[j];
                g[j] = cs[j] * g[j];
                g[j + 1] = g_new;
            }
            // Count this column so it takes part in the back substitution.
            // Neither r_norm nor the log is updated on this path.
            ++j;
            break;
        }

        Q[j + 1] = w / H[j + 1][j];

        // Apply the earlier Givens rotations to this column of H
        // (tridiagonal -> G_{j-2} creates fill-in, so at most two are needed)
        for (std::size_t i = (j >= 2 ? j - 2 : 0); i < j; ++i) {
            T tmp = cs[i] * H[i][j] + sn[i] * H[i + 1][j];
            H[i + 1][j] = -sn[i] * H[i][j] + cs[i] * H[i + 1][j];
            H[i][j] = tmp;
        }

        // j-th Givens rotation: eliminates the sub-diagonal entry H[j+1][j]
        T rr = std::sqrt(H[j][j] * H[j][j] + H[j + 1][j] * H[j + 1][j]);
        cs[j] = H[j][j] / rr;
        sn[j] = H[j + 1][j] / rr;
        H[j][j] = rr;
        H[j + 1][j] = T{0};

        // Rotate the right-hand side in the same way.
        T g_new = -sn[j] * g[j];
        g[j] = cs[j] * g[j];
        g[j + 1] = g_new;

        // |g[j+1]| serves as the residual estimate for this iteration; the
        // true residual is only recomputed once, after the loop.
        r_norm = std::abs(g[j + 1]);
        if (log) log->record(r_norm);

        if (r_norm <= threshold) {
            // Include the column just processed in the solve below.
            ++j;
            break;
        }
    }

    // Back substitution: R y = g
    const std::size_t dim = j;
    std::vector y(dim, T{0});
    for (std::size_t ii = 0; ii < dim; ++ii) {
        // Walk the rows from the last one up to the first.
        std::size_t idx = dim - 1 - ii;
        y[idx] = g[idx];
        for (std::size_t k = idx + 1; k < dim; ++k) {
            y[idx] -= H[idx][k] * y[k];
        }
        // NOTE(review): when the diagonal entry is at most epsilon in
        // magnitude the division is skipped and y[idx] keeps its undivided
        // value; the bound is absolute, not scaled.
        if (std::abs(H[idx][idx]) > std::numeric_limits ::epsilon()) {
            y[idx] /= H[idx][idx];
        }
    }

    // Solution update: x += Q * y
    for (std::size_t k = 0; k < dim; ++k) {
        x += Q[k] * y[k];
    }

    // The reported residual and the convergence flag come from the recomputed
    // residual rather than from the estimate tracked inside the loop.
    T final_rnorm = norm(b - A * x);
    return {x, final_rnorm, dim, final_rnorm <= threshold};
}

// ============================================================================
// FGMRES — Flexible GMRES (可変前処理対応)
// ============================================================================

/**
 * @brief Flexible GMRES (可変前処理対応)
 *
 * 通常の GMRES では各反復で同一の前処理が必要だが、
 * FGMRES では反復ごとに異なる前処理を適用できる。
 * 前処理付き基底ベクトルを別途保持するため、メモリは 2 倍。
 *
 * 参考: Saad (1993), "A Flexible Inner-Outer Preconditioned GMRES Algorithm"
 */
template requires concepts::OrderedField && std::integral SolverResult fgmres(
    const SparseMatrix & A,
    const Vector & b,
    const ConvergenceCriteria & criteria,
    std::size_t restart = 30,
    Preconditioner precond = {},
    std::optional > x0 = std::nullopt,
    SolverLog * log = nullptr)
{
    const auto n = static_cast