initial upload

2024-09-10 20:04:47 +08:00 · 2024-09-10 20:04:47 +08:00 · b4b4275576
commit b4b4275576
parent 12b778cd3e
40 changed files with 8751 additions and 35 deletions
--- a/.gitignore
+++ b/.gitignore
@ -1,34 +1,3 @@
-# ---> C++
+.DS_Store
-# Prerequisites
+build/
-*.d
+.vscode/
 # Compiled Object files
 *.slo
 *.lo
 *.o
 *.obj
 # Precompiled Headers
 *.gch
 *.pch
 # Compiled Dynamic libraries
 *.so
 *.dylib
 *.dll
 # Fortran module files
 *.mod
 *.smod
 # Compiled Static libraries
 *.lai
 *.la
 *.a
 *.lib
 # Executables
 *.exe
 *.out
 *.app
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@ -0,0 +1,28 @@
 cmake_minimum_required(VERSION 3.15.2)
 # Project name and version.
 project(GCTL_OPTIMIZATION VERSION 1.0)
 # Helper functions for writing package configuration files.
 include(CMakePackageConfigHelpers)
 message(STATUS "Platform: ${CMAKE_HOST_SYSTEM_NAME}")
 message(STATUS "Install prefix: ${CMAKE_INSTALL_PREFIX}")
 message(STATUS "Processor: ${CMAKE_HOST_SYSTEM_PROCESSOR}")
 # User-facing switches. Both default to ON, which reproduces the previous
 # behavior (TOML enabled, examples always built).
 option(GCTL_OPTIMIZATION_TOML "Use the TOML library" ON)
 option(GCTL_OPTIMIZATION_BUILD_EXAMPLES "Build the example programs" ON)
 message(STATUS "[GCTL_OPTIMIZATION] Use the TOML library: ${GCTL_OPTIMIZATION_TOML}")
 message(STATUS "[GCTL_OPTIMIZATION] Build the examples: ${GCTL_OPTIMIZATION_BUILD_EXAMPLES}")
 # GCTL is a hard dependency; its include directory is made visible to every
 # target defined in the sub-directories below.
 find_package(GCTL REQUIRED)
 include_directories(${GCTL_INC_DIR})
 # Generate the configuration header from its template so the sources can
 # test the options chosen above.
 # NOTE(review): the header is written into the source tree; moving it to the
 # binary tree would require matching include-path changes in lib/ -- confirm.
 configure_file(
 	"${PROJECT_SOURCE_DIR}/config.h.in"
 	"${PROJECT_SOURCE_DIR}/lib/optimization/gctl_optimization_config.h"
 	)
 # Library sources.
 add_subdirectory(lib)
 # Example programs (disable with -DGCTL_OPTIMIZATION_BUILD_EXAMPLES=OFF).
 if(GCTL_OPTIMIZATION_BUILD_EXAMPLES)
 	add_subdirectory(example)
 endif()
--- a/GCTL_OPTIMIZATIONConfig.cmake.in
+++ b/GCTL_OPTIMIZATIONConfig.cmake.in
@ -0,0 +1,25 @@
@PACKAGE_INIT@
 # Package configuration template for @PROJECT_NAME@. It publishes the
 # version, the install locations, the library name and the TOML switch,
 # resolves the GCTL dependency and finally loads the exported targets.
 include(CMakeFindDependencyMacro)
 set(@PROJECT_NAME@_VERSION "@PROJECT_VERSION@")
 # set_and_check() fails the find_package() call if a path does not exist.
 set_and_check(@PROJECT_NAME@_INSTALL_PREFIX "${PACKAGE_PREFIX_DIR}")
 set_and_check(@PROJECT_NAME@_INC_DIR "${PACKAGE_PREFIX_DIR}/include")
 set_and_check(@PROJECT_NAME@_INCLUDE_DIR "${PACKAGE_PREFIX_DIR}/include")
 set_and_check(@PROJECT_NAME@_LIB_DIR "${PACKAGE_PREFIX_DIR}/lib")
 set_and_check(@PROJECT_NAME@_LIBRARY_DIR "${PACKAGE_PREFIX_DIR}/lib")
 set(@PROJECT_NAME@_LIB gctl_optimization)
 set(@PROJECT_NAME@_LIBRARY gctl_optimization)
 set(@PROJECT_NAME@_TOML @GCTL_OPTIMIZATION_TOML@)
 # Stay silent when the consumer asked for find_package(... QUIET).
 if(NOT @PROJECT_NAME@_FIND_QUIETLY)
    message(STATUS "[GCTL_OPTIMIZATION] Use the TOML library: " @GCTL_OPTIMIZATION_TOML@)
 endif()
 if(NOT GCTL_FOUND)
    # find_dependency() forwards the QUIET/REQUIRED arguments of the calling
    # find_package() and marks this package as not found when GCTL is missing.
    find_dependency(GCTL)
    # Kept for backward compatibility: consumers get the GCTL headers on
    # their include path as before.
    include_directories(${GCTL_INC_DIR})
 endif()
 # include target information
 include("${CMAKE_CURRENT_LIST_DIR}/@PROJECT_NAME@Targets.cmake")
 check_required_components(@PROJECT_NAME@)
--- a/README.md
+++ b/README.md
@ -1,2 +1,17 @@
-# gctl_optimization
+## lcg_solver 共轭梯度求解器
 ### 求解器参数设置
 #### 1. 从toml文件读取参数
 用户可以从toml文件中读取并设置求解器参数。所有的参数都定义在名为lcg的顶级表格下，可设置的参数及类型如下所示：
 ```toml
 [lcg]
 max_iterations=<int>
 epsilon=<float>
 abs_diff=0|1
 restart_epsilon=<float>
 step=<float>
 sigma=<float>
 beta=<float>
 maxi_m=<int>
 ```
--- a/config.h.in
+++ b/config.h.in
@ -0,0 +1 @@
 /* Template line processed by CMake's configure_file(): becomes a #define of
    GCTL_OPTIMIZATION_TOML when that option is ON, otherwise a commented-out #undef. */
 #cmakedefine GCTL_OPTIMIZATION_TOML
--- a/example/CMakeLists.txt
+++ b/example/CMakeLists.txt
@ -0,0 +1,20 @@
 # Compile every example with -O3, appended to the flags inherited from the
 # parent directory.
 string(APPEND CMAKE_CXX_FLAGS " -O3")
 # Put the example executables under <build>/bin/examples. This variable
 # supersedes the deprecated EXECUTABLE_OUTPUT_PATH.
 set(CMAKE_RUNTIME_OUTPUT_DIRECTORY "${PROJECT_BINARY_DIR}/bin/examples")
 # add_example(<name> <switch>)
 #   Builds <name>.cpp into an executable called <name> when <switch> is a
 #   true value (e.g. ON); does nothing otherwise. The executable is compiled
 #   as C++17 and linked against GCTL and gctl_optimization.
 #   Example: add_example(ex1 ON)
 function(add_example name switch)
    if(NOT switch)
        return()
    endif()
    add_executable(${name} ${name}.cpp)
    set_target_properties(${name} PROPERTIES CXX_STANDARD 17 CXX_STANDARD_REQUIRED ON)
    target_link_libraries(${name} PRIVATE ${GCTL_LIB} gctl_optimization)
 endfunction()
 add_example(ex1 ON)
 add_example(ex2 ON)
 add_example(ex3 ON)
 add_example(ex4 ON)
 add_example(ex5 ON)
 add_example(ex6 ON)
 add_example(ex7 ON)
 add_example(ex8 ON)
--- a/example/ex1.cpp
+++ b/example/ex1.cpp
@ -0,0 +1,164 @@
 /********************************************************
 *  ██████╗ ███████╗████████╗██╗     
 * ██╔════╝ ██╔════╝╚══██╔══╝██║     
 * ██║  ███╗███████╗   ██║   ██║     
 * ██║   ██║╚════██║   ██║   ██║     
 * ╚██████╔╝███████║   ██║   ███████╗
 *  ╚═════╝ ╚══════╝   ╚═╝   ╚══════╝                       
 * Generic Scientific Template Library
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * The GSTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License (LGPL) along with 
 * this program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GSTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GSTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "../lib/optimization.h"
 #define M 1000
 #define N 800
 // Returns the largest absolute element-wise difference between a and b.
 // The loop runs over a.size() entries, so b must hold at least that many.
 // Returns -1.0 when a is empty.
 double max_diff(const gctl::array<double> &a, const gctl::array<double> &b)
 {
 	double max = -1.0;
 	for (size_t i = 0; i < a.size(); i++)
 	{
 		// fabs(d) instead of sqrt(d*d): same value, but d*d can overflow or
 		// underflow for extreme d, and fabs is cheaper.
 		max = std::max(fabs(a[i] - b[i]), max);
 	}
 	return max;
 }
 // Example solver built on gctl::lcg_solver. It owns a dense kernel matrix and
 // supplies the operator and preconditioner products used by the solver.
 class ex1 : public gctl::lcg_solver
 {
 public:
 	ex1();
 	virtual ~ex1();
 	// Operator product: writes kernel^T * (kernel * x) into ax.
 	virtual void LCG_Ax(const gctl::array<double> &x, gctl::array<double> &ax);
 	// Preconditioner product: combines p and x through vecmul() into mx.
 	virtual void LCG_Mx(const gctl::array<double> &x, gctl::array<double> &mx);
 	// Builds the right-hand side B that corresponds to the model x.
 	void cal_partb(const gctl::array<double> &x, gctl::array<double> &B);
 private:
 	gctl::matrix<double> kernel; // dense kernel matrix (plain 2D array)
 	gctl::array<double> tmp_arr; // scratch buffer for the intermediate product
 	gctl::array<double> p; // preconditioner entries
 };
 // Sizes the kernel to M x N, fills it through kernel.random(-1.0, 1.0,
 // gctl::RdUniform), and sets each preconditioner entry p[i] to the
 // reciprocal of the sum of squares of kernel column i.
 ex1::ex1()
 {
 	kernel.resize(M, N);
 	kernel.random(-1.0, 1.0, gctl::RdUniform);
 	tmp_arr.resize(M);
 	p.resize(N);
 	// Every entry of p is assigned in this loop, so no separate
 	// initialization pass is needed.
 	for (size_t i = 0; i < N; i++)
 	{
 		double diag = 0.0;
 		for (size_t j = 0; j < M; j++)
 		{
 			diag += kernel[j][i]*kernel[j][i];
 		}
 		p[i] = 1.0/diag;
 	}
 }
 // Nothing to release explicitly; members clean up after themselves.
 ex1::~ex1(){}
 // Produces the right-hand side B for model x by applying LCG_Ax to it.
 void ex1::cal_partb(const gctl::array<double> &x, gctl::array<double> &B)
 {
 	this->LCG_Ax(x, B);
 }
 // Operator product in two steps through the scratch buffer:
 // first kernel applied to x, then the transposed kernel applied to that.
 void ex1::LCG_Ax(const gctl::array<double> &x, gctl::array<double> &ax)
 {
 	// step 1: tmp_arr receives the product of kernel and x
 	matvec(tmp_arr, kernel, x);
 	// step 2: ax receives the product of the transposed kernel and tmp_arr
 	matvec(ax, kernel, tmp_arr, gctl::Trans);
 }
 // Preconditioner product: vecmul() combines p and x into mx
 // (presumably an element-wise product -- confirm against gctl).
 void ex1::LCG_Mx(const gctl::array<double> &x, gctl::array<double> &mx)
 {
 	vecmul(mx, p, x);
 }
 // Runs each solver variant on the same problem, starting from a zero model,
 // and reports the maximal difference to the reference model fm.
 // The first three runs write to log.txt, the remaining ones to std::clog.
 int main(int argc, char const *argv[])
 {
 	// Generate a reference (forward) model
 	gctl::array<double> fm(N);
 	gctl::random(fm, 1.0, 2.0, gctl::RdUniform);
 	ex1 test;
 	// Compute the right-hand side B of the conjugate gradient system
 	gctl::array<double> B(N);
 	test.cal_partb(fm, B);
 	// Declare the solution vector
 	gctl::array<double> m(N, 0.0);
 	test.set_lcg_message(gctl::LCG_SOLUTION);
 	// NOTE(review): the stream is not checked for a failed open.
 	std::ofstream ofile("log.txt");
 	test.LCG_Minimize(m, B, gctl::LCG_CG, ofile);
 	ofile << "maximal difference: " << max_diff(fm, m) << std::endl;
 	// Reset the model to zero before every further run
 	m.assign_all(0.0);
 	test.LCG_Minimize(m, B, gctl::LCG_PCG, ofile);
 	ofile << "maximal difference: " << max_diff(fm, m) << std::endl;
 	m.assign_all(0.0);
 	test.LCG_Minimize(m, B, gctl::LCG_CGS, ofile);
 	ofile << "maximal difference: " << max_diff(fm, m) << std::endl;
 	ofile.close();
 	// NOTE(review): same message level as set above; looks redundant -- confirm.
 	test.set_lcg_message(gctl::LCG_SOLUTION);
 	m.assign_all(0.0);
 	test.LCG_Minimize(m, B, gctl::LCG_BICGSTAB);
 	std::clog << "maximal difference: " << max_diff(fm, m) << std::endl;
 	m.assign_all(0.0);
 	test.LCG_Minimize(m, B, gctl::LCG_BICGSTAB2);
 	std::clog << "maximal difference: " << max_diff(fm, m) << std::endl;
 	// Box constraints for the constrained solvers: every entry within [1, 2]
 	gctl::array<double> low(N, 1.0);
 	gctl::array<double> hig(N, 2.0);
 	m.assign_all(0.0);
 	test.LCG_MinimizeConstrained(m, B, low, hig, gctl::LCG_PG);
 	std::clog << "maximal difference: " << max_diff(fm, m) << std::endl;
 	m.assign_all(0.0);
 	test.LCG_MinimizeConstrained(m, B, low, hig, gctl::LCG_SPG);
 	std::clog << "maximal difference: " << max_diff(fm, m) << std::endl;
 	return 0;
 }
--- a/example/ex2.cpp
+++ b/example/ex2.cpp
@ -0,0 +1,175 @@
 /********************************************************
 *  ██████╗ ███████╗████████╗██╗     
 * ██╔════╝ ██╔════╝╚══██╔══╝██║     
 * ██║  ███╗███████╗   ██║   ██║     
 * ██║   ██║╚════██║   ██║   ██║     
 * ╚██████╔╝███████║   ██║   ███████╗
 *  ╚═════╝ ╚══════╝   ╚═╝   ╚══════╝                       
 * Generic Scientific Template Library
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * The GSTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License (LGPL) along with 
 * this program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GSTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GSTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "../lib/optimization.h"
 #define M 100
 #define N 90
 // Draws a pseudo-random double between l and t (both ends reachable),
 // consuming exactly one rand() value.
 double random_double(double l, double t)
 {
 	const double span = t - l;
 	const double scaled = span*rand();
 	return scaled*1.0/RAND_MAX + l;
 }
 // Draws a pseudo-random integer in the half-open range [small, big).
 // An empty or inverted range (big <= small) returns small without calling
 // rand(); previously big == small caused a modulo by zero.
 int random_int(int small, int big)
 {
 	if (big <= small) return small;
 	return (rand() % (big - small)) + small;
 }
 class ex2 : public gctl::lgd_solver
 {
 protected:
    gctl::matrix<double> kernel;
    gctl::array<double> obs, tmp;
 protected:
    double LGD_Evaluate(const gctl::array<double> &x, gctl::array<double> &g);
 public:
    ex2();
    virtual ~ex2(){}
    void CalObs(const gctl::array<double> &x);
 };
 // Sizes the buffers, seeds rand() from the clock and writes 25 to 34 random
 // values in [-10, 10] into randomly chosen columns of every kernel row.
 // A column drawn twice in one row is simply overwritten.
 ex2::ex2()
 {
 	kernel.resize(M, N);
 	tmp.resize(M);
 	obs.resize(M);
 	srand(time(0));
 	for (int row = 0; row < M; ++row)
 	{
 		const int draws = random_int(25, 35);
 		for (int d = 0; d < draws; ++d)
 		{
 			const int col = random_int(0, N);
 			const double val = random_double(-10, 10);
 			kernel[row][col] = val;
 		}
 	}
 }
 // Mean squared misfit between the kernel response to x and the observations.
 // Writes the gradient (2/M * kernel^T * residual) to g and returns
 // sum(residual^2)/M. The residual is left in tmp.
 double ex2::LGD_Evaluate(const gctl::array<double> &x, gctl::array<double> &g)
 {
 	// residual: tmp = kernel*x - obs, with the squared misfit accumulated alongside
 	double misfit = 0.0;
 	for (int r = 0; r < M; ++r)
 	{
 		double acc = 0.0;
 		for (int c = 0; c < N; ++c)
 		{
 			acc += kernel[r][c] * x[c];
 		}
 		tmp[r] = acc - obs[r];
 		misfit += tmp[r]*tmp[r];
 	}
 	// gradient: g = (2/M) * kernel^T * tmp
 	for (int c = 0; c < N; ++c)
 	{
 		double acc = 0.0;
 		for (int r = 0; r < M; ++r)
 		{
 			acc += kernel[r][c]*tmp[r];
 		}
 		g[c] = acc * (2.0/M);
 	}
 	return misfit/M;
 }
 // Fills obs with the kernel response to x, then perturbs every entry with
 // noise drawn from [-1e-3, 1e-3].
 void ex2::CalObs(const gctl::array<double> &x)
 {
 	for (int r = 0; r < M; ++r)
 	{
 		// forward response of row r
 		double response = 0.0;
 		for (int c = 0; c < N; ++c)
 		{
 			response += kernel[r][c]*x[c];
 		}
 		obs[r] = response;
 		// add noise
 		obs[r] += random_double(-1e-3, 1e-3);
 	}
 }
 int main(int argc, char const *argv[])
 {
    gctl::array<double> m(N, 0.0), mean_m(N, 0.0), stddev_m(N, 0.0), low(N), hig(N);
    // 生成一组正演解 包含一些大值和一些小值
 	gctl::array<double> fm(N);
 	int N2 = (int) N/2;
 	for (int i = 0; i < N2; i++)
 	{
 		//fm[i] = random_double(5, 10);
 		fm[i] = 10.0;
 	}
 	for (int i = N2; i < N; i++)
 	{
 		//fm[i] = random_double(1, 2);
 		fm[i] = 1.0;
 	}
 	for (int i = 0; i < N2; i++)
 	{
 		low[i] = 9.0; // 对解的范围进行约束
 		hig[i] = 11.0;
 	}
 	for (int i = N2; i < N; i++)
 	{
 		low[i] = 0.0;
 		hig[i] = 2.0;
 	}
    ex2 e;
    e.CalObs(fm);
 	gctl::lgd_para my_para = e.default_lgd_para();
 	my_para.flight_times = 20000;
 	my_para.batch = 100;
    e.set_lgd_para(my_para);
    e.LGD_Minimize(m, mean_m, stddev_m, low, hig);
 	for (int i = 0; i < N; i++)
 	{
 		std::cout << fm[i] << " " << m[i] << " " << mean_m[i] << " " << stddev_m[i] << " " << fabs(mean_m[i] - fm[i]) << std::endl;
 	}
 	return 0;
 }
--- a/example/ex3.cpp
+++ b/example/ex3.cpp
@ -0,0 +1,69 @@
 #include "../lib/optimization.h"
 // Example objective for gctl::lbfgs_solver with three unknowns.
 class TEST_FUNC : public gctl::lbfgs_solver
 {
 public:
 	TEST_FUNC();
 	~TEST_FUNC();
 	// Configures the solver, minimizes from m_x and shows the result.
 	void Routine();
 	// Objective callback: returns the function value at x, gradient in g.
 	virtual double LBFGS_Evaluate(const gctl::array<double> &x, gctl::array<double> &g);
 private:
 	gctl::array<double> m_x; // model vector (three entries)
 };
 // Starts the model as three entries, via m_x.resize(3, 0.0).
 TEST_FUNC::TEST_FUNC()
 {
 	m_x.resize(3, 0.0);
 }
 // No explicit cleanup required.
 TEST_FUNC::~TEST_FUNC() {}
 // Test system (the constants in the code carry a little added noise):
 //   3   =  3*x1 + x2 + 2*x3*x3
 //   1   = -3*x1 + 5*x2*x2 + 2*x1*x3
 //   -12 = 25*x1*x2 + 20*x3
 // Returns the Euclidean norm of the three residuals and writes the gradient
 // of that norm to g. No guard exists for a zero norm.
 double TEST_FUNC::LBFGS_Evaluate(const gctl::array<double> &x, gctl::array<double> &g)
 {
 	const double f0 = 3*x[0] + x[1] + 2*x[2]*x[2] - 3.012;
 	const double f1 = -3*x[0] + 5*x[1]*x[1] + 2*x[0]*x[2] - 1.04252;
 	const double f2 = 25*x[0]*x[1] + 20*x[2] + 12.12479;
 	const double norm = sqrt(f0*f0+f1*f1+f2*f2);
 	// chain rule on sqrt(f0^2 + f1^2 + f2^2)
 	g[0] = 0.5*(6*f0+2*f1*(2*x[2]-3)+50*f2*x[1])/norm;
 	g[1] = 0.5*(2*f0+20*f1*x[1]+50*f2*x[0])/norm;
 	g[2] = 0.5*(8*f0*x[2]+4*f1*x[0]+40*f2)/norm;
 	return norm;
 }
 void TEST_FUNC::Routine()
 {
 	gctl::lbfgs_para self_para = default_lbfgs_para();
 	self_para.m = 10;
 	self_para.past = 5;
 	self_para.residual = 1e-10;
 	//self_para.min_step = 1e-30;
 	//self_para.max_linesearch = 40;
 	//self_para.linesearch = gctl::LBFGS_LINESEARCH_BACKTRACKING_WOLFE;
 	set_lbfgs_para(self_para);
 	std::ofstream ofile("log.txt");
 	show_lbfgs_para(ofile);
 	double fx = LBFGS_Minimize(m_x, ofile);
 	ofile.close();
 	m_x.show();
 	return;
 }
 int main(int argc, char const *argv[])
 {
 	TEST_FUNC test;
 	test.Routine();
 	return 0;
 }
--- a/example/ex4.cpp
+++ b/example/ex4.cpp
@ -0,0 +1,91 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "gctl/core.h"
 #include "gctl/algorithm.h"
 #include "../lib/optimization.h"
 #include "iostream"
 #include "iomanip"
 using std::cout;
 using std::endl;
 using std::setw;
 int main(int argc, char const *argv[])
 {
 	gctl::matrix<double> A(4, 3);
 	for (int i = 0; i < A.row_size(); i++)
 	{
 		for (int j = 0; j < A.col_size(); j++)
 		{
 			A[i][j] = 3*(i+1) + j - 2;
 		}
 	}
 	A[3][1] = 1;
 	cout<<"A(" << A.row_size() << ", " << A.col_size() << ") = " <<endl;
 	A.show();
 	gctl::svd svdd;
 	svdd.decompose(A);
 	cout<<"U(" << svdd.U.row_size() << ", " << svdd.U.col_size() << ") = " <<endl;
 	svdd.U.show();
 	cout<<"S(" << svdd.S.size() << ") = " << endl;
 	svdd.S.show();
 	cout<<"V(" << svdd.V.row_size() << ", " << svdd.V.col_size() << ") = " <<endl;
 	svdd.V.show();
 	int sig_num = svdd.get_singular_number();
 	double tmp_d;
 	gctl::array<double> tmp(sig_num);
 	cout<<"U^T * S * V(" << A.row_size() << ", " << A.col_size() << ") = " <<endl;
 	for(int i=0;i<A.row_size();i++)
 	{
 		for (int k = 0; k < sig_num; k++)
 		{
 			tmp[k] = svdd.U[k][i] * svdd.S[k];
 		}
 		for(int j=0;j<A.col_size();j++)
 		{
 			tmp_d = 0.0;
 			for (int k = 0; k < sig_num; k++)
 			{
 				tmp_d += tmp[k] * svdd.V[k][j];
 			}
 			cout<<setw(12)<<tmp_d<<' ';
 		}
 		cout<<endl;
 	}
 	cout<<endl;
 	return 0;
 }
--- a/example/ex5.cpp
+++ b/example/ex5.cpp
@ -0,0 +1,78 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "gctl/core.h"
 #include "gctl/algorithm.h"
 #include "../lib/optimization.h"
 // Solves A*x = B with gctl::lu, where B is built from a known model m, and
 // prints m next to the recovered x for comparison.
 int main(int argc, char const *argv[])
 {
 	const int n = 5;
 	gctl::matrix<double> A(n, n);
 	for (int r = 0; r < n; r++)
 	{
 		for (int c = 0; c < n; c++)
 		{
 			A[r][c] = 3*(r+1) + c - 2;
 		}
 	}
 	// A must have full rank, so a few entries are overridden
 	A[1][2] = 3.4;
 	A[4][1] = 2.1;
 	A[3][4] = 9.7;
 	A[2][3] = 2.7;
 	std::cout << "A(5, 5) = " << std::endl;
 	for (int r = 0; r < n; r++)
 	{
 		for (int c = 0; c < n; c++)
 		{
 			std::cout << A[r][c] << ' ';
 		}
 		std::cout << std::endl;
 	}
 	std::cout << std::endl;
 	// right-hand side B = A*m for the known model m
 	gctl::array<double> m(n, 0.5), x(n, 0.0);
 	gctl::array<double> B(n);
 	for (int r = 0; r < n; r++)
 	{
 		B[r] = 0.0;
 		for (int c = 0; c < n; c++)
 		{
 			B[r] += A[r][c] * m[c];
 		}
 	}
 	gctl::lu glu(A);
 	glu.decompose();
 	glu.solve(B, x);
 	for (size_t i = 0; i < 5; i++)
 	{
 		std::cout << m[i] << " " << x[i] << std::endl;
 	}
 	return 0;
 }
--- a/example/ex6.cpp
+++ b/example/ex6.cpp
@ -0,0 +1,90 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "gctl/core.h"
 #include "gctl/algorithm.h"
 #include "../lib/optimization.h"
 // Draws a pseudo-random double between l and t (both ends reachable),
 // consuming exactly one rand() value.
 double random_double(double l, double t)
 {
 	const double span = t - l;
 	const double scaled = span*rand();
 	return scaled*1.0/RAND_MAX + l;
 }
 // Builds a random symmetric 5x5 matrix, solves A*x = B with gctl::cholesky
 // for a right-hand side built from a known model m, and prints m next to x.
 int main(int argc, char const *argv[])
 {
 	srand(time(0));
 	const int n = 5;
 	gctl::matrix<double> A(n, n);
 	// draw the upper triangle (diagonal in [1, 3], off-diagonal in [0.1, 1])
 	// and mirror each value to the lower triangle
 	for (int r = 0; r < n; r++)
 	{
 		for (int c = r; c < n; c++)
 		{
 			const double val = (r == c) ? random_double(1.0, 3.0) : random_double(0.1, 1.0);
 			A[r][c] = val;
 			A[c][r] = val;
 		}
 	}
 	std::cout << "A(5, 5) = " << std::endl;
 	for (int r = 0; r < n; r++)
 	{
 		for (int c = 0; c < n; c++)
 		{
 			std::cout << A[r][c] << ' ';
 		}
 		std::cout << std::endl;
 	}
 	std::cout << std::endl;
 	// right-hand side B = A*m for the known model m
 	gctl::array<double> m(n, 0.5), x(n, 0.0);
 	gctl::array<double> B(n);
 	for (int r = 0; r < n; r++)
 	{
 		B[r] = 0.0;
 		for (int c = 0; c < n; c++)
 		{
 			B[r] += A[r][c] * m[c];
 		}
 	}
 	gctl::cholesky gck(A);
 	gck.decompose();
 	gck.solve(B, x);
 	for (size_t i = 0; i < 5; i++)
 	{
 		std::cout << m[i] << " " << x[i] << std::endl;
 	}
 	return 0;
 }
--- a/example/ex7.cpp
+++ b/example/ex7.cpp
@ -0,0 +1,124 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "gctl/core.h"
 #include "gctl/algorithm.h"
 #include "../lib/optimization.h"
 typedef gctl::array<std::complex<double>> cd_array;
 #define N 1000
 // Returns the largest magnitude of the element-wise difference between a
 // and b. The loop runs over a.size() entries, so b must hold at least that
 // many. Returns -1 when a is empty.
 double max_diff(const cd_array &a, const cd_array &b)
 {
 	double max = -1;
 	for (size_t i = 0; i < a.size(); i++)
 	{
 		// std::abs gives the magnitude |a[i] - b[i]|. std::norm, used
 		// previously, returns the squared magnitude.
 		max = std::max(std::abs(a[i] - b[i]), max);
 	}
 	return max;
 }
 // Example problem for gctl::clcg_solver with a dense complex kernel.
 class ex7 : public gctl::clcg_solver
 {
 public:
 	ex7();
 	virtual ~ex7();
 	// Builds the right-hand side B for model x.
 	void cal_partb(const cd_array &x, cd_array &B);
 	// Operator product requested by the solver, with layout/conjugation flags.
 	virtual void CLCG_Ax(const cd_array &x, cd_array &ax, gctl::matrix_layout_e layout, gctl::conjugate_type_e conj);
 private:
 	gctl::matrix<std::complex<double>> kernel; // dense kernel (plain 2D array)
 };
 // Fills the N x N kernel symmetrically: one random real value per
 // upper-triangular entry (diagonal included), mirrored to the lower triangle.
 ex7::ex7()
 {
 	// N*(N+1)/2 values cover the upper triangle
 	gctl::array<double> tmp(round(0.5*(N+1)*N));
 	gctl::random(tmp, 1.0, 2.0, gctl::RdUniform);
 	kernel.resize(N, N);
 	size_t next = 0;
 	for (int row = 0; row < N; row++)
 	{
 		for (int col = row; col < N; col++)
 		{
 			kernel[row][col] = tmp[next];
 			kernel[col][row] = kernel[row][col];
 			next++;
 		}
 	}
 }
 // No explicit cleanup required.
 ex7::~ex7() {}
 // Right-hand side for model x: B receives the matvec of kernel and x.
 void ex7::cal_partb(const cd_array &x, cd_array &B)
 {
 	gctl::matvec(B, kernel, x);
 }
 // Operator product for the solver: forwards the requested layout and
 // conjugation flags to gctl::matvec on the kernel.
 void ex7::CLCG_Ax(const cd_array &x, cd_array &ax, gctl::matrix_layout_e layout, gctl::conjugate_type_e conj)
 {
 	gctl::matvec(ax, kernel, x, layout, conj);
 }
 int main(int argc, char const *argv[])
 {
 	// 生成一组正演解
    gctl::array<double> tmp(2*N);
    gctl::random(tmp, 1.0, 2.0, gctl::RdUniform);
    cd_array fm(N);
    for (size_t i = 0; i < N; i++)
    {
        fm[i].real(tmp[2*i]);
        fm[i].imag(tmp[2*i + 1]);
    }
    ex7 test;
 	// 计算共轭梯度B项
    cd_array B(N);
    test.cal_partb(fm, B);
 	// 声明一组解
 	cd_array m(N, std::complex<double>(0.0, 0.0));
    gctl::clcg_para my_para = test.default_clcg_para();
    my_para.abs_diff = 1;
    test.set_clcg_para(my_para);
    test.CLCG_Minimize(m, B, gctl::CLCG_BICG_SYM);
    std::clog << "maximal difference: " << max_diff(fm, m) << std::endl;
 	return 0;
 }
--- a/example/ex8.cpp
+++ b/example/ex8.cpp
@ -0,0 +1,233 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "gctl/core.h"
 #include "gctl/algorithm.h"
 #include "../lib/optimization.h"
 #define M 1000
 #define N 900
 // Draws a pseudo-random double between l and t (both ends reachable),
 // consuming exactly one rand() value.
 double random_double(double l, double t)
 {
 	const double span = t - l;
 	const double scaled = span*rand();
 	return scaled*1.0/RAND_MAX + l;
 }
 // Draws a pseudo-random integer in the half-open range [small, big).
 // An empty or inverted range (big <= small) returns small without calling
 // rand(); previously big == small caused a modulo by zero.
 int random_int(int small, int big)
 {
 	if (big <= small) return small;
 	return (rand() % (big - small)) + small;
 }
 // Largest absolute element-wise difference between a and b, taken over
 // a.size() entries; -1.0 when a is empty.
 double max_diff(const gctl::_1d_array &a, const gctl::_1d_array &b)
 {
 	double worst = -1.0;
 	for (size_t idx = 0; idx < a.size(); ++idx)
 	{
 		const double gap = fabs(a[idx] - b[idx]);
 		worst = std::max(gap, worst);
 	}
 	return worst;
 }
 // Example that fits one model to three data sets at once, combining the
 // three losses through gctl::grad_norm inside an L-BFGS minimization.
 class ex8 : public gctl::lbfgs_solver, public gctl::grad_norm
 {
 public:
 	ex8();
 	virtual ~ex8();
 	// Stores the (noisy) responses of the three kernels to x as targets.
 	void CalTarget(const gctl::_1d_array &x);
 	// Objective callback: combined loss at x, combined gradient in g.
 	virtual double LBFGS_Evaluate(const gctl::_1d_array &x, gctl::_1d_array &g);
 	// Progress callback: updates the loss weights, then defers to the base class.
 	virtual int LBFGS_Progress(const gctl::_1d_array &x, const gctl::_1d_array &g, const double fx,
 		const double converge, const double rate, const gctl::lbfgs_para param, int k, int ls, std::ostream &ss);
 private:
 	gctl::_1d_array obs1, obs2, obs3, tmp, grad; // targets and scratch buffers
 	gctl::_2d_matrix k1, k2, k3; // the three kernels
 };
 // Seeds rand() from the clock, sizes the scratch buffers and builds three
 // M x N kernels whose random entries differ in scale:
 // [-1, 1], [-200, 200] and [-0.01, 0.01].
 ex8::ex8()
 {
 	srand(time(0));
 	tmp.resize(M);
 	grad.resize(N);
 	// Sizes one kernel/target pair, then writes 25 to 34 random values in
 	// [lo, hi] into randomly chosen columns of every row. A column drawn
 	// twice in one row is simply overwritten.
 	auto build = [](gctl::_2d_matrix &kernel, gctl::_1d_array &obs, double lo, double hi)
 	{
 		kernel.resize(M, N);
 		obs.resize(M);
 		for (int row = 0; row < M; row++)
 		{
 			const int draws = random_int(25, 35);
 			for (int d = 0; d < draws; d++)
 			{
 				const int col = random_int(0, N);
 				const double val = random_double(lo, hi);
 				kernel[row][col] = val;
 			}
 		}
 	};
 	build(k1, obs1, -1.0, 1.0);
 	build(k2, obs2, -200.0, 200.0);
 	build(k3, obs3, -0.01, 0.01);
 }
 // No explicit cleanup required.
 ex8::~ex8() {}
 // Registers one loss per data set (k1/obs1, k2/obs2, k3/obs3, in that order)
 // and returns the combined value from GradNormLoss, which also fills g.
 double ex8::LBFGS_Evaluate(const gctl::_1d_array &x, gctl::_1d_array &g)
 {
 	// One data term: residual in tmp, gradient 2/M * kernel^T * residual in
 	// grad, loss = (L2 module of the residual)^2 / M.
 	auto add_term = [this, &x](gctl::_2d_matrix &kernel, gctl::_1d_array &obs)
 	{
 		gctl::matvec(tmp, kernel, x);
 		tmp -= obs;
 		gctl::matvec(grad, kernel, tmp, gctl::Trans);
 		gctl::scale(grad, 2.0/M);
 		AddSingleLoss(gctl::power2(gctl::module(tmp, gctl::L2))/M, grad);
 	};
 	add_term(k1, obs1);
 	add_term(k2, obs2);
 	add_term(k3, obs3);
 	return GradNormLoss(g);
 }
 // Progress hook: calls UpdateWeights() first, then hands every argument on
 // to the base-class implementation and returns its result.
 int ex8::LBFGS_Progress(const gctl::_1d_array &x, const gctl::_1d_array &g, const double fx,
 	const double converge, const double rate, const gctl::lbfgs_para param, int k, int ls, std::ostream &ss)
 {
 	UpdateWeights();
 	const int status = gctl::lbfgs_solver::LBFGS_Progress(x, g, fx, converge, rate, param, k, ls, ss);
 	return status;
 }
 // Computes the response of each kernel to x and stores it, perturbed by
 // noise drawn from [-1e-3, 1e-3], as the corresponding target.
 void ex8::CalTarget(const gctl::_1d_array &x)
 {
 	auto make_target = [&x](gctl::_1d_array &obs, gctl::_2d_matrix &kernel)
 	{
 		// forward response
 		gctl::matvec(obs, kernel, x);
 		// add noise
 		for (int i = 0; i < M; i++)
 		{
 			obs[i] += random_double(-1e-3, 1e-3);
 		}
 	};
 	make_target(obs1, k1);
 	make_target(obs2, k2);
 	make_target(obs3, k3);
 }
 // Generates a random reference model, derives the three targets from it,
 // minimizes from a zero start and reports the maximal difference to the
 // reference, followed by the recorded values printed three per line.
 int main(int argc, char const *argv[])
 {
 	// reference model
 	gctl::_1d_array fm(N);
 	random(fm, 1.0, 2.0, gctl::RdUniform);
 	ex8 test;
 	// fitting targets
 	test.CalTarget(fm);
 	// solution vector, starting at zero
 	gctl::_1d_array m(N, 0.0);
 	gctl::lbfgs_para self_para = test.default_lbfgs_para();
 	self_para.linesearch = gctl::LBFGS_LINESEARCH_BACKTRACKING_STRONG_WOLFE;
 	self_para.epsilon = 1e-6;
 	test.set_lbfgs_para(self_para);
 	test.show_lbfgs_para();
 	// three losses over N unknowns
 	test.InitGradNorm(3, N);
 	test.set_control_weight(1.0);
 	test.set_weight_step(0.00001);
 	// the returned objective value is not used here
 	test.LBFGS_Minimize(m);
 	std::clog << "maximal difference: " << max_diff(fm, m) << std::endl;
 	gctl::_1d_array records;
 	test.get_records(records);
 	for (size_t i = 0; i < records.size(); i++)
 	{
 		// every third value ends the line
 		const bool ends_line = ((i+1)%3 == 0);
 		std::cout << records[i] << (ends_line ? "\n" : " ");
 	}
 	return 0;
 }
--- a/54
+++ b/54
@ -0,0 +1,54 @@
 #!/bin/bash
 # Configure, build, install and remove the package with CMake and GNU stow.
 #
 # Usage: ./installer [option] [Cmake options]
 #   The first argument selects the action; every further argument is passed
 #   to CMake as -D<argument> (for example FOO=ON becomes -DFOO=ON).
 if [[ $# == 0 || ${1} == "help" ]]; then
 	echo "Compiles executables/libraries and maintains installed files. Two tools 'Cmake' and 'stow' are employed here. For more information, see https://cmake.org and https://www.gnu.org/software/stow/."
 	echo ""
 	echo "School of Earth Sciences, Zhejiang University"
 	echo "Yi Zhang (yizhang-geo@zju.edu.cn)"
 	echo ""
 	echo "Usage: ./installer [option] [Cmake options]"
 	echo ""
 	echo "Options:"
 	echo "(1) configure: Configure Cmake project(s). This option could take extra Cmake options as in <option>=<value>."
 	echo "(2)     build: Build executables/libraries."
 	echo "(3)   install: Install executables/libraries to the directory of CMAKE_INSTALL_PREFIX and sym-links them to the target address. This offers a quick and clean remove of the installed files."
 	echo "(4)     clean: Clean build/ folder(s)."
 	echo "(5) uninstall: Delete the installed files and sym-links."
 	echo "(6)      info: Print out current setups."
 	echo "(7)      help: Show help information."
 	exit 0
 fi
 package=gctl_optimization
 address=/opt/stow
 taress=/usr/local
 # The CMake arguments live in an array so that each one reaches cmake as a
 # single word, even when a value contains spaces.
 option=(-DCMAKE_BUILD_TYPE=Release "-DCMAKE_INSTALL_PREFIX=${address}/${package}")
 # Only the arguments AFTER the action are CMake options; the action itself
 # must never be turned into a -D definition.
 for opt in "${@:2}"; do
 	option+=("-D${opt}")
 done
 case "${1}" in
 	configure)
 		# Start from an empty build directory, creating it when missing.
 		mkdir -p build && cd build && rm -rf ./* && cmake .. "${option[@]}"
 		;;
 	build)
 		cd build && make
 		;;
 	install)
 		# Create the sym-links only when the installation itself succeeded.
 		cd build && sudo make install && sudo stow --dir="${address}" --target="${taress}" -S "${package}"
 		;;
 	clean)
 		rm -rf build/
 		;;
 	uninstall)
 		sudo stow --dir="${address}" --target="${taress}" -D "${package}"
 		# ':?' aborts instead of expanding to "/" should a variable be empty.
 		sudo rm -rf "${address:?}/${package:?}"
 		;;
 	info)
 		echo "package name:" "${package}"
 		echo "stow address:" "${address}"
 		echo "target address:" "${taress}"
 		echo "Cmake options:" "${option[*]}"
 		;;
 	*)
 		echo "Unknown option: ${1}. Run './installer help' for usage." >&2
 		exit 1
 		;;
 esac
--- a/lib/CMakeLists.txt
+++ b/lib/CMakeLists.txt
@ -0,0 +1,64 @@
 # Compiler flags: the library sources are always optimised with -O3.
 set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -O3")
 set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -O3")
 # Directory that receives the built libraries.
 set(LIBRARY_OUTPUT_PATH ${PROJECT_BINARY_DIR}/lib)
 # Collect every source file found in optimization/.
 aux_source_directory(optimization/ GCTL_OPTIMAL_SRC)
 # Library targets.
 # Target names must be unique, so the shared and the static library cannot
 # use the same one. CMake adds the "lib" prefix and the platform suffix itself.
 add_library(gctl_optimization SHARED ${GCTL_OPTIMAL_SRC})
 add_library(gctl_optimization_static STATIC ${GCTL_OPTIMAL_SRC})
 # Give the static archive the same base name as the shared library.
 # (The former CLEAN_DIRECT_OUTPUT property is obsolete and was dropped.)
 set_target_properties(gctl_optimization_static PROPERTIES OUTPUT_NAME "gctl_optimization")
 # Version numbers of the shared library.
 set_target_properties(gctl_optimization PROPERTIES VERSION ${PROJECT_VERSION} SOVERSION ${PROJECT_VERSION_MAJOR}.${PROJECT_VERSION_MINOR})
 # Run-time search path of the installed libraries.
 set_target_properties(gctl_optimization PROPERTIES INSTALL_RPATH /usr/local/lib)
 set_target_properties(gctl_optimization_static PROPERTIES INSTALL_RPATH /usr/local/lib)
 # Both libraries are compiled as C++17.
 set_target_properties(gctl_optimization gctl_optimization_static PROPERTIES CXX_STANDARD 17 CXX_STANDARD_REQUIRED ON)
 # Link against GCTL. The scope keyword is given on both targets; PUBLIC keeps
 # the transitive behaviour the keyword-less signature had.
 target_link_libraries(gctl_optimization PUBLIC ${GCTL_LIB})
 target_link_libraries(gctl_optimization_static PUBLIC ${GCTL_LIB})
 # Package configuration files. They are generated in this project's own binary
 # directory so that the build also works when used as a sub-project.
 set(CONFIG_FILE_PATH lib/cmake/${PROJECT_NAME})
 configure_package_config_file("${PROJECT_SOURCE_DIR}/${PROJECT_NAME}Config.cmake.in"
     "${PROJECT_BINARY_DIR}/${PROJECT_NAME}Config.cmake"
     INSTALL_DESTINATION ${CONFIG_FILE_PATH})
 write_basic_package_version_file("${PROJECT_BINARY_DIR}/${PROJECT_NAME}ConfigVersion.cmake"
     VERSION ${PROJECT_VERSION}
     COMPATIBILITY SameMajorVersion)
 # Installation of the libraries.
 if(WIN32)
     install(TARGETS gctl_optimization DESTINATION lib)
     install(TARGETS gctl_optimization_static DESTINATION lib)
 else()
     install(TARGETS gctl_optimization gctl_optimization_static
         EXPORT ${PROJECT_NAME}Targets
         LIBRARY DESTINATION lib
         ARCHIVE DESTINATION lib)
     install(EXPORT ${PROJECT_NAME}Targets
         DESTINATION ${CONFIG_FILE_PATH})
     install(FILES
         "${PROJECT_BINARY_DIR}/${PROJECT_NAME}Config.cmake"
         "${PROJECT_BINARY_DIR}/${PROJECT_NAME}ConfigVersion.cmake"
         DESTINATION ${CONFIG_FILE_PATH})
 endif()
 # Installation of the headers.
 file(GLOB GCTL_HEAD *.h)
 file(GLOB GCTL_OPTIMAL_HEAD optimization/*.h)
 install(FILES ${GCTL_HEAD} DESTINATION include/gctl)
 install(FILES ${GCTL_OPTIMAL_HEAD} DESTINATION include/gctl/optimization)
--- a/lib/optimization.h
+++ b/lib/optimization.h
@ -0,0 +1,43 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_OPTIMIZATION_H
 #define _GCTL_OPTIMIZATION_H
 #include "optimization/loss_func.h"
 #include "optimization/lu.h"
 #include "optimization/cholesky.h"
 #include "optimization/svd.h"
 #include "optimization/lcg.h"
 #include "optimization/clcg.h"
 #include "optimization/lgd.h"
 #include "optimization/lbfgs.h"
 #include "optimization/sgd.h"
 #include "optimization/gradnorm.h"
 #include "optimization/dwa.h"
 #endif // _GCTL_OPTIMIZATION_H
--- a/lib/optimization/cholesky.cpp
+++ b/lib/optimization/cholesky.cpp
@ -0,0 +1,127 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "cholesky.h"
 /**
  * Bind the solver to sourceMatrix. Only a reference is stored, so the
  * caller's matrix is the one that decompose() later overwrites.
  *
  * Throws domain_error when the matrix is empty or not square.
  */
 gctl::cholesky::cholesky(matrix<double> &sourceMatrix) : decomposedMatrix(sourceMatrix)
 {
    // Guard 1: nothing to decompose.
    if (sourceMatrix.empty())
    {
        throw domain_error("Invalid input matrix. From cholesky::cholesky(...)");
    }

    // Guard 2: the matrix has to be square.
    if (sourceMatrix.row_size() != sourceMatrix.col_size())
    {
        throw domain_error("Invalid input matrix. From cholesky::cholesky(...)");
    }
 }
 /**
  * Decompose the bound matrix in place.
  *
  * The matrix is walked column by column. The lower triangle receives the
  * Cholesky factor L; every off-diagonal entry is also mirrored into the
  * upper triangle, which is what solve() reads during back substitution.
  *
  * Throws runtime_error when a pivot is not strictly positive (the matrix is
  * not positive definite) or is NaN. The matrix may be partly overwritten
  * when that happens.
  */
 void gctl::cholesky::decompose()
 {
    // Enumerate matrix columnwise
    for (int j = 0; j < decomposedMatrix.col_size(); j++)
    {
        for (int i = j; i < decomposedMatrix.row_size(); i++)
        {
            if (i == j)
            {
                // Diagonal entry: L[j][j] = sqrt(A[j][j] - sum_k L[j][k]^2)
                double sum = 0.0;
                for (int k = 0; k < i; k++)
                {
                    sum += std::pow(decomposedMatrix[i][k], 2.0);
                }

                const double pivot = decomposedMatrix[i][j] - sum;
                // Written as !(pivot > 0) so that a NaN pivot is rejected as
                // well; a plain "<= 0" comparison lets NaN slip through.
                if (!(pivot > 0.0))
                {
                    throw runtime_error("The input matrix is not positively defined. From gctl::cholesky::decompose()");
                }

                decomposedMatrix[i][j] = std::sqrt(pivot);
            }
            else
            {
                // Off-diagonal entry: L[i][j] = (A[i][j] - sum_k L[i][k]*L[j][k]) / L[j][j]
                double sum = 0.0;
                for (int k = 0; k < j; k++)
                {
                    sum += (decomposedMatrix[i][k] * decomposedMatrix[j][k]);
                }

                decomposedMatrix[i][j] = (1 / decomposedMatrix[j][j]) * (decomposedMatrix[i][j] - sum);
                // Mirror into the upper triangle (transpose of L).
                decomposedMatrix[j][i] = decomposedMatrix[i][j];
            }
        }
    }
    return;
 }
 /**
  * Solve Ax = b, where A is the original input matrix. decompose() must have
  * been called before, because the triangular factors are read from the
  * bound matrix.
  *
  * b is the right-hand side; it must have as many entries as the matrix has rows.
  * x receives the solution and is resized to the size of b.
  *
  * Throws domain_error when b is empty or its size differs from the matrix size.
  */
 void gctl::cholesky::solve(const array<double>& b, array<double> &x)
 {
    if (b.empty())
    {
        throw domain_error("Invalid target vector. From cholesky::solve(...)");
    }

    const int n = static_cast<int>(b.size());
    // A longer b would index past the end of the matrix below.
    if (n != static_cast<int>(decomposedMatrix.row_size()))
    {
        throw domain_error("The target vector does not match the matrix size. From cholesky::solve(...)");
    }

    x.resize(b.size());

    // First solve lower triangular * x = b with forward substitution
    for (int i = 0; i < n; i++)
    {
        double sum = 0.0;
        for (int j = 0; j < i; j++)
        {
            sum += (decomposedMatrix[i][j] * x[j]);
        }
        x[i] = (b[i] - sum) / decomposedMatrix[i][i];
    }

    // Now solve upper triangular (transpose of lower triangular) * x = x with back substitution.
    // Note that x can be solved in place using the existing x vector.  No need to allocate 
    // another vector.
    for (int i = n - 1; i >= 0; i--)
    {
        double sum = 0.0;
        for (int j = n - 1; j > i; j--)
        {
            sum += (decomposedMatrix[i][j] * x[j]);
        }
        x[i] = (x[i] - sum) / decomposedMatrix[i][i];
    }
    return;
 }
--- a/lib/optimization/cholesky.h
+++ b/lib/optimization/cholesky.h
@ -0,0 +1,55 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _CHOLESKY_H
 #define _CHOLESKY_H
 #include "gctl/core.h"
 namespace gctl
 {
    /**
     * @brief      Cholesky decomposition of a square matrix into a lower triangular
     *             factor and its transpose, plus a solver for Ax = b based on it.
     * 
     * @note       Restricted to positive-definite matrices. The object keeps a
     *             reference to the caller's matrix and decomposes it in place, so
     *             that matrix has to outlive the object and loses its original values.
     *             Objects of this class cannot be copied.
     */
    class cholesky
    {
    public:
        /// Bind to sourceMatrix (decomposed in place later). Throws domain_error for an empty or non-square matrix.
        cholesky(matrix<double> &sourceMatrix);
        virtual ~cholesky(){}
        /// Decomposition into triangular matrices. Throws runtime_error when the matrix is not positive definite.
        void decompose();
        /// Solve for x in form Ax = b, where A is the original input matrix. Reads the factors written by decompose(); x is resized to b.size().
        void solve(const array<double>& b, array<double> &x);
    protected:
        // Copying is disabled.
        cholesky(const gctl::cholesky&) = delete;
        void operator=(const gctl::cholesky&) = delete;
        // Reference to the caller's matrix; holds the factors after decompose().
        matrix<double> &decomposedMatrix;
    };
 }
 #endif // _CHOLESKY_H
--- a/lib/optimization/clcg.cpp
+++ b/lib/optimization/clcg.cpp
@ -0,0 +1,373 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "clcg.h"
 /**
 * Default parameters of the complex conjugate gradient methods, in the
 * member order of clcg_para: max_iterations = 0 (no iteration limit),
 * epsilon = 1e-8, abs_diff = 0 (relative convergence measure).
 */
 static const gctl::clcg_para clcg_defparam = {0, 1e-8, 0};
 /**
  * Default progress reporter. Writes the iteration count and the current
  * convergence value to std::clog when convergence has been reached or when
  * the iteration count is a multiple of the report interval.
  *
  * Always returns 0; an override may return a non-zero value, which the
  * solver treats as a request to stop.
  */
 int gctl::clcg_solver::CLCG_Progress(const array<std::complex<double> > &m, const double converge, const clcg_para &param, size_t t)
 {
    const bool reached = (converge <= param.epsilon);
    // An interval of zero switches the periodic report off.
    const bool due = !reached && clcg_inter_ > 0 && t%clcg_inter_ == 0;

    if (reached || due)
    {
        std::clog << GCTL_CLEARLINE << "\rIteration-times: " << t << "\tconvergence: " << converge;
    }
    return 0;
 }
 /**
  * Start with the default parameters, a report interval of one iteration
  * and the silent mode switched off.
  */
 gctl::clcg_solver::clcg_solver()
    : clcg_param_(clcg_defparam), clcg_inter_(1), clcg_silent_(false)
 {
 }

 /// Nothing to release.
 gctl::clcg_solver::~clcg_solver()
 {
 }
 /// Switch the silent mode on; CLCG_Minimize() then skips its timing and status output.
 void gctl::clcg_solver::clcg_silent()
 {
    clcg_silent_ = true;
 }
 /// Set how many iterations lie between two progress reports; zero disables the periodic report.
 void gctl::clcg_solver::set_clcg_report_interval(size_t inter)
 {
    clcg_inter_ = inter;
 }
 /// Replace the solver parameters with a copy of in_param. The values are checked when a solver runs, not here.
 void gctl::clcg_solver::set_clcg_para(const clcg_para &in_param)
 {
    clcg_param_ = in_param;
 }
 // The declaration of this overload (and the toml.hpp include) only exist
 // when GCTL_OPTIMIZATION_TOML is defined, so the definition needs the same guard.
 #ifdef GCTL_OPTIMIZATION_TOML
 /**
  * Read the solver parameters from the "clcg" table of toml_data.
  *
  * The parameters are first reset to their defaults; every key that is
  * present in the table ("max_iterations", "epsilon", "abs_diff") then
  * overrides its default. A missing "clcg" table leaves the defaults in place.
  */
 void gctl::clcg_solver::set_clcg_para(const toml::value &toml_data)
 {
    clcg_param_ = clcg_defparam;

    std::string CLCG = "clcg";
    if (toml_data.contains(CLCG))
    {
        if (toml_data.at(CLCG).contains("max_iterations")) clcg_param_.max_iterations = toml::find<int>(toml_data, CLCG, "max_iterations");
        if (toml_data.at(CLCG).contains("epsilon"))        clcg_param_.epsilon = toml::find<double>(toml_data, CLCG, "epsilon");
        if (toml_data.at(CLCG).contains("abs_diff"))       clcg_param_.abs_diff = toml::find<int>(toml_data, CLCG, "abs_diff");
    }
    return;
 }
 #endif // GCTL_OPTIMIZATION_TOML
 /**
  * Report the meaning of a solver return code.
  *
  * err_code   code returned by one of the solvers.
  * ss         stream that receives the message.
  * err_throw  when true and err_code is negative, the message is thrown as
  *            std::runtime_error instead of being written. When true and
  *            err_code is non-negative, the bare message is written without
  *            decoration or line break.
  *
  * With err_throw == false the message is written with a coloured
  * "Success"/"Fail" prefix and terminated by a line break.
  */
 void gctl::clcg_solver::clcg_error_str(clcg_return_code err_code, std::ostream &ss, bool err_throw)
 {
    // Coloured prefix. The Windows console is coloured through the console
    // API, other platforms through ANSI escape sequences.
 #if defined _WINDOWS || __WIN32__
    if (!err_throw)
    {
        if (err_code >= 0)
        {
            SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), FOREGROUND_INTENSITY | FOREGROUND_GREEN);
            ss << "Success! ";
        }
        else
        {
            SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), FOREGROUND_INTENSITY | FOREGROUND_RED);
            ss << "Fail! ";
        }
    }
 #else
    if (!err_throw)
    {
        if (err_code >= 0)
            ss << "\033[1m\033[32mCLCG Success! ";
        else
            ss << "\033[1m\033[31mCLCG Fail! ";
    }
 #endif

    std::string err_str;
    switch (err_code)
    {
        case CLCG_SUCCESS:
            err_str = "Iteration reached convergence."; break;
        case CLCG_STOP:
            err_str = "Iteration is stopped by the progress evaluation function."; break;
        case CLCG_ALREADY_OPTIMIZIED:
            err_str = "The variables are already optimized."; break;
        case CLCG_UNKNOWN_ERROR:
            err_str = "Unknown error."; break;
        case CLCG_INVILAD_VARIABLE_SIZE:
            err_str = "The size of the variables is negative."; break;
        case CLCG_INVILAD_MAX_ITERATIONS:
            err_str = "The maximal iteration times is negative."; break;
        case CLCG_INVILAD_EPSILON:
            err_str = "The epsilon is not in the range (0, 1)."; break;
        case CLCG_REACHED_MAX_ITERATIONS:
            err_str = "The maximal iteration has been reached."; break;
        case CLCG_NAN_VALUE:
            err_str = "The model values are NaN."; break;
        case CLCG_INVALID_POINTER:
            err_str = "Invalid pointer."; break;
        case CLCG_SIZE_NOT_MATCH:
            err_str = "The sizes of the solution and target do not match."; break;
        case CLCG_UNKNOWN_SOLVER:
            err_str = "Unknown solver."; break;
        default:
            err_str = "Unknown error."; break;
    }

    if (err_throw && err_code < 0) throw std::runtime_error(err_str.c_str());
    else ss << err_str;

    // Restore the default colour and finish the line. This is the same for
    // success and failure.
 #if defined _WINDOWS || __WIN32__
    if (!err_throw)
    {
        SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), 7);
        ss << std::endl;
    }
 #else
    if (!err_throw)
    {
        ss << "\033[0m" << std::endl;
    }
 #endif
    return;
 }
 /// Return a copy of the built-in default parameters (clcg_defparam).
 gctl::clcg_para gctl::clcg_solver::default_clcg_para()
 {
    return clcg_defparam;
 }
 /**
  * Run the solver selected by solver_id on the system whose right-hand side is B.
  *
  * m          start solution on entry, updated by the solver.
  * B          right-hand side.
  * solver_id  solver to use; an unknown value throws std::invalid_argument.
  * ss         stream for the status message.
  * verbose    write the status message even when the solver succeeded.
  * er_throw   throw std::runtime_error for a negative return code instead of
  *            writing the message; this also suppresses the timing line.
  *
  * In silent mode no timing or status is written, and a negative return code
  * is always thrown as std::runtime_error.
  */
 void gctl::clcg_solver::CLCG_Minimize(array<std::complex<double> > &m, const array<std::complex<double> > &B, 
    clcg_solver_type solver_id, std::ostream &ss, bool verbose, bool er_throw)
 {
    // Single place that maps a solver id to its member function.
    auto run_solver = [&]() -> clcg_return_code
    {
        switch (solver_id)
        {
            case CLCG_BICG:     return clbicg(m, B);
            case CLCG_BICG_SYM: return clbicg_symmetric(m, B);
            case CLCG_CGS:      return clcgs(m, B);
            case CLCG_BICGSTAB: return clbicgstab(m, B);
            case CLCG_TFQMR:    return cltfqmr(m, B);
            default: break;
        }
        throw std::invalid_argument("Invalid solver type. gctl::clcg_solver<T>::Minimize(...)");
    };

    if (clcg_silent_)
    {
        clcg_return_code ret = run_solver();
        if (ret < 0) clcg_error_str(ret, ss, true);
        return;
    }

    // Time the run: wall-clock time with OpenMP, processor time otherwise.
 #ifdef GCTL_OPENMP
    double start = omp_get_wtime();
    clcg_return_code ret = run_solver();
    double end = omp_get_wtime();
    double costime = 1000*(end-start);
 #else
    clock_t start = clock();
    clcg_return_code ret = run_solver();
    clock_t end = clock();
    double costime = 1000*(end-start)/(double)CLOCKS_PER_SEC;
 #endif

    if (!er_throw)
    {
        const char *solver_name;
        switch (solver_id)
        {
            case CLCG_BICG:     solver_name = "Bi-CG"; break;
            case CLCG_BICG_SYM: solver_name = "Bi-CG (symmetrically accelerated)"; break;
            case CLCG_CGS:      solver_name = "CGS"; break;
            // This solver used to be reported as "CGS".
            case CLCG_BICGSTAB: solver_name = "Bi-CGSTAB"; break;
            case CLCG_TFQMR:    solver_name = "TFQMR"; break;
            default:            solver_name = "Unknown"; break;
        }

        ss << std::endl;
        std::clog << "Solver: " << solver_name << ". Times cost: " << costime << " ms" << std::endl;
    }

    if (verbose) clcg_error_str(ret, ss, er_throw);
    else if (ret < 0) clcg_error_str(ret, ss, er_throw);
    return;
 }
 /**
  * Bi-CG solver. It is not implemented: m and B are not touched.
  *
  * Returns CLCG_UNKNOWN_SOLVER, a negative code, so that callers see a
  * defined failure. The function used to return an uninitialised value.
  */
 gctl::clcg_return_code gctl::clcg_solver::clbicg(array<std::complex<double> > &m, const array<std::complex<double> > &B)
 {
    return CLCG_UNKNOWN_SOLVER;
 }
 /**
  * Bi-CG iteration for a complex symmetric system, using a single residual
  * (r1k) and a single search direction (d1k). The matrix is only accessed
  * through CLCG_Ax().
  *
  * m  start solution on entry, updated in place; must have the size of B.
  * B  right-hand side.
  *
  * Returns CLCG_CONVERGENCE, CLCG_ALREADY_OPTIMIZIED or CLCG_STOP on success
  * and a negative code otherwise (invalid parameters, size mismatch, NaN in
  * the solution, iteration limit reached).
  */
 gctl::clcg_return_code gctl::clcg_solver::clbicg_symmetric(array<std::complex<double> > &m, const array<std::complex<double> > &B)
 {
    size_t n_size = B.size();
    //check parameters
    if (n_size <= 0) return CLCG_INVILAD_VARIABLE_SIZE;
    // m is updated with vectors of length n_size below, so it must match B.
    if (m.size() != n_size) return CLCG_SIZE_NOT_MATCH;
    if (clcg_param_.max_iterations < 0) return CLCG_INVILAD_MAX_ITERATIONS;
    if (clcg_param_.epsilon <= 0.0 || clcg_param_.epsilon >= 1.0) return CLCG_INVILAD_EPSILON;

    r1k.resize(n_size);
    d1k.resize(n_size);
    Ax.resize(n_size);

    // Initial residual r = B - A*m, which is also the first search direction.
    CLCG_Ax(m, Ax, gctl::NoTrans, gctl::NoConj);

    std::complex<double> one_z(1.0, 0.0);
    vecdiff(r1k, B, Ax, one_z, one_z);
    veccpy(d1k, r1k, one_z);

    std::complex<double> rkrk = vecdot(r1k, r1k);

    double r0_square, rk_square;
    std::complex<double> r0_mod, rk_mod;
    // NOTE(review): the start value uses vecinner() while the loop below uses
    // vecdot() for the same quantity - confirm that this is intended.
    rk_mod = vecinner(r1k, r1k);
    r0_square = rk_square = std::norm(rk_mod);

    // The relative measure is never scaled by a reference smaller than one.
    if (r0_square < 1.0) r0_square = 1.0;

    clcg_return_code ret;
    if (clcg_param_.abs_diff && sqrt(rk_square)/n_size <= clcg_param_.epsilon)
    {
        ret = CLCG_ALREADY_OPTIMIZIED;
        CLCG_Progress(m, sqrt(rk_square)/n_size, clcg_param_, 0);
        return ret;
    }	
    else if (rk_square/r0_square <= clcg_param_.epsilon)
    {
        ret = CLCG_ALREADY_OPTIMIZIED;
        CLCG_Progress(m, rk_square/r0_square, clcg_param_, 0);
        return ret;
    }

    double residual;
    std::complex<double> ak, rkrk2, betak, dkAx;

    size_t t = 0;
    while(1)
    {
        // Convergence measure of the current iterate.
        if (clcg_param_.abs_diff) residual = sqrt(rk_square)/n_size;
        else residual = rk_square/r0_square;

        // A non-zero return of the progress callback stops the iteration.
        if (CLCG_Progress(m, residual, clcg_param_, t))
        {
            ret = CLCG_STOP; return ret;
        }

        if (residual <= clcg_param_.epsilon)
        {
            ret = CLCG_CONVERGENCE; return ret;
        }

        // max_iterations == 0 means "no limit".
        if (clcg_param_.max_iterations > 0 && t+1 > clcg_param_.max_iterations)
        {
            ret = CLCG_REACHED_MAX_ITERATIONS;
            break;
        }

        t++;

        // Step length along the current direction.
        CLCG_Ax(d1k, Ax, gctl::NoTrans, gctl::NoConj);
        dkAx = vecdot(d1k, Ax);
        ak = rkrk/dkAx;

        // Update the solution and the residual.
        vecapp(m, d1k, ak);
        vecsub(r1k, Ax, ak);

        rk_mod = vecdot(r1k, r1k);
        rk_square = std::norm(rk_mod);

        if (!vecvalid(m))
        {
            ret = CLCG_NAN_VALUE; return ret;
        }

        // New search direction.
        rkrk2 = vecdot(r1k, r1k);
        betak = rkrk2/rkrk;
        rkrk = rkrk2;

        vecadd(d1k, d1k, r1k, betak, one_z);
    }

    return ret;
 }
 /**
  * CGS solver. It is not implemented: m and B are not touched.
  *
  * Returns CLCG_UNKNOWN_SOLVER, a negative code, so that callers see a
  * defined failure. The function used to return an uninitialised value.
  */
 gctl::clcg_return_code gctl::clcg_solver::clcgs(array<std::complex<double> > &m, const array<std::complex<double> > &B)
 {
    return CLCG_UNKNOWN_SOLVER;
 }
 /**
  * Bi-CGSTAB solver. It is not implemented: m and B are not touched.
  *
  * Returns CLCG_UNKNOWN_SOLVER, a negative code, so that callers see a
  * defined failure. The function used to return an uninitialised value.
  */
 gctl::clcg_return_code gctl::clcg_solver::clbicgstab(array<std::complex<double> > &m, const array<std::complex<double> > &B)
 {
    return CLCG_UNKNOWN_SOLVER;
 }
 /**
  * TFQMR solver. It is not implemented: m and B are not touched.
  *
  * Returns CLCG_UNKNOWN_SOLVER, a negative code, so that callers see a
  * defined failure. The function used to return an uninitialised value.
  */
 gctl::clcg_return_code gctl::clcg_solver::cltfqmr(array<std::complex<double> > &m, const array<std::complex<double> > &B)
 {
    return CLCG_UNKNOWN_SOLVER;
 }
--- a/lib/optimization/clcg.h
+++ b/lib/optimization/clcg.h
@ -0,0 +1,166 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_CLCG_H
 #define _GCTL_CLCG_H
 #include "gctl/core.h"
 #include "gctl/maths.h"
 #include "gctl/algorithm.h"
 #include "gctl_optimization_config.h"
 #ifdef GCTL_OPTIMIZATION_TOML
 #include "toml.hpp"
 #endif // GCTL_OPTIMIZATION_TOML
 #if defined _WINDOWS || __WIN32__
 #include "windows.h"
 #endif // _WINDOWS || __WIN32__
 namespace gctl
 {
    /**
     * @brief      Solver types accepted by clcg_solver::CLCG_Minimize().
     */
    enum clcg_solver_type
    {
        /**
         * Bi-Conjugate Gradient method (Bi-CG).
         */
        CLCG_BICG,
        /**
         * Bi-Conjugate Gradient method accelerated for a complex symmetric A.
         */
        CLCG_BICG_SYM,
        /**
         * Conjugate Gradient Squared Method with real coefficients.
         */
        CLCG_CGS,
        /**
         * Bi-Conjugate Gradient Stabilized method (Bi-CGSTAB).
         */
        CLCG_BICGSTAB,
        /**
         * Transpose Free Quasi-Minimal Residual Method
         */
        CLCG_TFQMR,
    };
    /**
     * @brief      Return values of the solver functions of clcg_solver.
     *
     * Values greater than or equal to zero report a successful run. Every
     * error code is negative: the list starts at -1024 and counts upwards.
     */
    enum clcg_return_code
    {
        CLCG_SUCCESS = 0, ///< The solver function terminated successfully.
        CLCG_CONVERGENCE = 0, ///< The iteration reached convergence (same value as CLCG_SUCCESS).
        CLCG_STOP, ///< The iteration is stopped by the monitoring function.
        CLCG_ALREADY_OPTIMIZIED, ///< The initial solution is already optimized.
        // A negative number means an error
        CLCG_UNKNOWN_ERROR = -1024, ///< Unknown error.
        CLCG_INVILAD_VARIABLE_SIZE, ///< The variable size is invalid (zero).
        CLCG_INVILAD_MAX_ITERATIONS, ///< The maximal iteration times is negative.
        CLCG_INVILAD_EPSILON, ///< The epsilon is not inside the open interval (0, 1).
        CLCG_REACHED_MAX_ITERATIONS, ///< Iteration reached maximal limit.
        CLCG_NAN_VALUE, ///< Nan value.
        CLCG_INVALID_POINTER, ///< Invalid pointer.
        CLCG_SIZE_NOT_MATCH, ///< Sizes of m and B do not match
        CLCG_UNKNOWN_SOLVER, ///< Unknown solver
    };
    /**
     * @brief      Parameters of the complex conjugate gradient methods.
     */
    struct clcg_para
    {
        /**
         * Maximal iteration times. The process will continue till the convergence is met
         * if this option is set to zero (default). Negative values are rejected by the solver.
        */
        int max_iterations;
        /**
         * Epsilon for convergence test.
         * This parameter determines the accuracy with which the solution is to be found. 
         * The iteration terminates when the convergence measure selected by abs_diff drops 
         * to epsilon or below. The value has to lie inside the open interval (0, 1); the 
         * default is 1e-8.
        */
        double epsilon;
        /**
         * Selects the convergence measure; used as a boolean flag. 
         * Zero (default): the squared residual measure divided by its start value, where a 
         * start value smaller than 1.0 is replaced by 1.0. 
         * Non-zero: the square root of the residual measure divided by the number of 
         * variables (an absolute measure).
         */
        int abs_diff;
    };
    /**
     * @brief      Base class of the complex linear conjugate gradient solvers.
     *
     * A derived class supplies the matrix-vector product by implementing CLCG_Ax()
     * and may override CLCG_Progress() to monitor or stop the iteration.
     */
    class clcg_solver
    {
    private:
        clcg_para clcg_param_; // Parameters used by the solvers
 		size_t clcg_inter_; // Number of iterations between two progress reports
 		bool clcg_silent_; // True: CLCG_Minimize() writes neither timing nor status
        array<std::complex<double> > r1k, r2k, d1k, d2k; // Work vectors (residuals and search directions)
 	    array<std::complex<double> > Ax; // Work vector holding the latest product returned by CLCG_Ax()
    public:
        clcg_solver(); ///< Starts with the default parameters, a report interval of 1 and silent mode off.
        virtual ~clcg_solver();
        /// Matrix-vector product callback: has to write the product for x into ax. layout and conj select the transposed/conjugated variant.
        virtual void CLCG_Ax(const array<std::complex<double> > &x, array<std::complex<double> > &ax, 
            matrix_layout_e layout, conjugate_type_e conj) = 0;
        /// Progress callback, called with the current solution m, the convergence value and the iteration count t. A non-zero return value stops the iteration.
        virtual int CLCG_Progress(const array<std::complex<double> > &m, const double converge, const clcg_para &param, size_t t);
        void clcg_silent(); ///< Switch the silent mode on.
 		void set_clcg_report_interval(size_t inter); ///< Set the number of iterations between two progress reports.
 		void set_clcg_para(const clcg_para &param); ///< Replace the solver parameters.
 		void clcg_error_str(clcg_return_code err_code, std::ostream &ss = std::clog, bool err_throw =  false); ///< Write (or, with err_throw, throw) the message that belongs to err_code.
 		clcg_para default_clcg_para(); ///< Return the default parameters.
 #ifdef GCTL_OPTIMIZATION_TOML
        void set_clcg_para(const toml::value &toml_data); ///< Read the parameters from the "clcg" table of toml_data.
 #endif // GCTL_OPTIMIZATION_TOML
        // The individual solvers. m holds the start solution on entry and is updated in place; B is the right-hand side.
        clcg_return_code clbicg(array<std::complex<double> > &m, const array<std::complex<double> > &B);
        clcg_return_code clbicg_symmetric(array<std::complex<double> > &m, const array<std::complex<double> > &B);
        clcg_return_code clcgs(array<std::complex<double> > &m, const array<std::complex<double> > &B);
        clcg_return_code clbicgstab(array<std::complex<double> > &m, const array<std::complex<double> > &B);
        clcg_return_code cltfqmr(array<std::complex<double> > &m, const array<std::complex<double> > &B);
        /// Run the solver selected by solver_id, then report timing and status on ss/std::clog. With er_throw a negative return code is thrown as std::runtime_error.
        void CLCG_Minimize(array<std::complex<double> > &m, const array<std::complex<double> > &B, 
            clcg_solver_type solver_id = CLCG_CGS, std::ostream &ss = std::clog, 
            bool verbose = true, bool er_throw = false);
    };
 }
 #endif // _GCTL_CLCG_H
--- a/lib/optimization/dwa.cpp
+++ b/lib/optimization/dwa.cpp
@ -0,0 +1,129 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "dwa.h"
 // Construct an empty evaluator. InitDWA() must still be called before use.
 gctl::dwa::dwa()
 {
    // Give every scalar member a defined value. multi_fx_ is only ever accumulated
    // with += in AddSingleLoss() and reset in DWALoss(), so leaving it uninitialized
    // makes the first merged objective value indeterminate.
    fx_c_ = 0;
    fx_n_ = 0;
    K_ = 0.0;
    T_ = 1.0;
    multi_fx_ = 0.0;
    l_ready_ = false;
 }
 // Nothing to release explicitly; the members clean up after themselves.
 gctl::dwa::~dwa(){}
 void gctl::dwa::InitDWA(size_t num, size_t grad_num)
 {
    fx_n_ = num;
    K_ = 1.0*num;
    T_ = 1.0;
    wgts_.resize(num, 1.0);
    L_p1_.resize(num, 1.0);
    L_p2_.resize(num, 1.0);
    grad_.resize(grad_num, 0.0);
    rcd_wgts_.push_back(wgts_);
    return;
 }
 void gctl::dwa::AddSingleLoss(double fx, const array<double> &g)
 {
    multi_fx_ += wgts_[fx_c_]*fx;
    L_p2_[fx_c_] = L_p1_[fx_c_];
    L_p1_[fx_c_] = fx;
    for (size_t i = 0; i < g.size(); i++)
    {
        grad_[i] += wgts_[fx_c_]*g[i];
    }
    fx_c_++;
    return;
 }
 // Recompute the weights of all loss functions and append them to the records.
 // The first call after construction only produces unit weights.
 void gctl::dwa::UpdateWeights()
 {
    double total = 0.0;
    size_t k = 0;
    // Raw weights: exp of the ratio of the two latest loss values scaled by the temperature.
    while (k < fx_n_)
    {
        wgts_[k] = l_ready_ ? exp(L_p1_[k]/(L_p2_[k]*T_)) : 1.0;
        total += wgts_[k];
        ++k;
    }
    // Rescale so that the weights sum up to K_.
    for (k = 0; k < fx_n_; ++k)
    {
        wgts_[k] *= K_/total;
    }
    l_ready_ = true;
    rcd_wgts_.push_back(wgts_);
 }
 // Return the merged objective value and copy the merged gradients into g.
 // The accumulated value, the gradients and the loss counter are reset afterwards.
 // Throws std::runtime_error unless exactly fx_n_ losses were added since the last call.
 double gctl::dwa::DWALoss(array<double> &g)
 {
    if (fx_c_ != fx_n_)
    {
        // The message now names this function (it used to point at UpdateWeights()).
        throw std::runtime_error("Not enough loss functions evaluated. From gctl::dwa::DWALoss(...)");
    }
    double fx = multi_fx_;
    g = grad_;
    // Get ready for the next round of AddSingleLoss() calls.
    fx_c_ = 0;
    multi_fx_ = 0.0;
    grad_.assign_all(0.0);
    return fx;
 }
 void gctl::dwa::set_control_temperature(double t)
 {
    T_ = t;
    return;
 }
 void gctl::dwa::set_normal_sum(double k)
 {
    K_ = k;
    return;
 }
 // Flatten the recorded weights into logs, one record after another
 // (fx_n_ values per record).
 void gctl::dwa::get_records(array<double> &logs)
 {
    const size_t n_rec = rcd_wgts_.size();
    logs.resize(fx_n_*n_rec);
    // pos always equals r*fx_n_ + c.
    size_t pos = 0;
    for (size_t r = 0; r < n_rec; ++r)
    {
        for (size_t c = 0; c < fx_n_; ++c)
        {
            logs[pos] = rcd_wgts_[r][c];
            ++pos;
        }
    }
 }
--- a/lib/optimization/dwa.h
+++ b/lib/optimization/dwa.h
@ -0,0 +1,114 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_DWA_H
 #define _GCTL_DWA_H
 #include "gctl/core.h"
 namespace gctl
 {
    /**
     * @brief Loss balanced multitask evaluation using dynamically averaged weights (DWA).
     * 
     * @note Reference: 2019. End-to-end multitask learning with attention.
     * 
     * @note Call InitDWA() first. In every iteration call AddSingleLoss() once for each 
     * loss function and then DWALoss() to get the merged value. UpdateWeights() is 
     * presumably called once per iteration as well - confirm against the callers.
     */
    class dwa
    {
    private:
        bool l_ready_; // false until UpdateWeights() has been called once
        size_t fx_c_, fx_n_; // number of losses added so far / total number of losses
        double K_, T_, multi_fx_; // normal sum of the weights / temperature / merged objective value
        array<double> wgts_; // current weights of the loss functions
        array<double> L_p1_, L_p2_; // latest and second latest values of the loss functions
        array<double> grad_; // merged (weighted) model gradients
        std::vector<array<double>> rcd_wgts_; // recorded weights, one entry per record
    public:
        dwa();
        virtual ~dwa();
        /**
         * @brief Initiate the number of loss functions and size of the model gradients.
         * 
         * @note  This function must be called at first. It sets the normal sum to num 
         * and the temperature to 1.0, and records the initial weights (all ones).
         * 
         * @param num Number of the loss functions
         * @param grad_num Size of the model gradients
         */
        void InitDWA(size_t num, size_t grad_num);
        /**
         * @brief Add the value of a single loss function and the current model gradients.
         * 
         * @note The value and the gradients are multiplied by the current weight of the 
         * loss function before they are added to the merged ones.
         * 
         * @param fx objective value
         * @param g model gradients
         */
        void AddSingleLoss(double fx, const array<double> &g);
        /**
         * @brief Get the merged objective value and the model gradients.
         * 
         * @note All single loss functions must be added before calling this function, 
         * otherwise a std::runtime_error is thrown. The merged objective value and the 
         * model gradients will be reset after the calling.
         * 
         * @param g model gradients
         * 
         * @return objective value
         */
        double DWALoss(array<double> &g);
        /**
         * @brief Update weights for single loss functions using the DWA algorithm.
         * 
         * @note The first call only produces unit weights. Later calls use the ratio of 
         * the two latest values of each loss function. The new weights are scaled to sum 
         * up to the normal sum and are appended to the records.
         */
        void UpdateWeights();
        /**
         * @brief Set the cooling temperature. The bigger the value is, the closer the weights will be to each other. The default is 1.0.
         * 
         * @note InitDWA() resets the temperature to 1.0, so call this function afterwards.
         * 
         * @param t Input temperature
         */
        void set_control_temperature(double t);
        /**
         * @brief Set the normal sum of the weights. The default equals the number of the loss functions.
         * 
         * @note InitDWA() resets the normal sum, so call this function afterwards.
         * 
         * @param k Input sum
         */
        void set_normal_sum(double k);
        /**
         * @brief Get the recorded weights. Size of the log equals the number of the loss functions times the number of records.
         * 
         * @note One record is stored by InitDWA() and one by every call of UpdateWeights().
         * 
         * @param logs Output log
         */
        void get_records(array<double> &logs);
    };
 }
 #endif // _GCTL_DWA_H
--- a/lib/optimization/gctl_optimization_config.h
+++ b/lib/optimization/gctl_optimization_config.h
@ -0,0 +1 @@
 #define GCTL_OPTIMIZATION_TOML
--- a/lib/optimization/gradnorm.cpp
+++ b/lib/optimization/gradnorm.cpp
@ -0,0 +1,328 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "gradnorm.h"
 // Construct an uninitialized evaluator. InitGradNorm() must still be called before use.
 gctl::grad_norm::grad_norm()
 {
    // Give every scalar member a defined value. multi_fx_ is only ever accumulated
    // with += in AddSingleLoss() and reset in GradNormLoss(), so leaving it
    // uninitialized makes the first merged objective value indeterminate.
    fx_c_ = 0;
    fx_n_ = 0;
    alpha_ = 1.0;
    lamda_ = 0.001;
    T_ = 1.0;
    resi_T_ = 0.0;
    multi_fx_ = 0.0;
    initialized_ = false;
 }
 // Nothing to release explicitly; the members clean up after themselves.
 gctl::grad_norm::~grad_norm(){}
 void gctl::grad_norm::InitGradNorm(size_t num, size_t grad_num)
 {
    fx_n_ = num;
    T_ = 1.0;
    resi_T_ = 0.0;
    fst_iter_.resize(num, true);
    wgts_.resize(num, 1.0/num);
    fx0_.resize(num, 0.0);
    Gw_.resize(num, 0.0);
    Gdw_.resize(num, 0.0);
    Lx_.resize(num, 0.0);
    grad_.resize(grad_num, 0.0);
    rcd_fxs_.resize(num, 0.0);
    fixed_wgts_.resize(num, -1.0);
    rcd_wgts_.reserve(100000);
    for (size_t i = 0; i < fx_n_; i++)
    {
        rcd_wgts_.push_back(wgts_[i]);
    }
    initialized_ = true;
    return;
 }
 double gctl::grad_norm::AddSingleLoss(double fx, const array<double> &g)
 {
    if (fst_iter_[fx_c_])
    {
        fx0_[fx_c_] = fx;
        fst_iter_[fx_c_] = false;
    }
    Lx_[fx_c_] = fx/fx0_[fx_c_];
    double curr_fx = wgts_[fx_c_]*fx;
    multi_fx_ += curr_fx;
    rcd_fxs_[fx_c_] = fx;
    double sum = 0.0;
    for (size_t i = 0; i < g.size(); i++)
    {
        sum += g[i]*g[i];
        grad_[i] += wgts_[fx_c_]*g[i];
    }
    Gw_[fx_c_] = sqrt(wgts_[fx_c_]*wgts_[fx_c_]*sum);
    Gdw_[fx_c_] = sqrt(sum); // wgts_[fx_c_]*sum/Gw_[fx_c_]
    fx_c_++;
    return curr_fx;
 }
 // Move every non-fixed weight one step of size lamda_*Gdw_ up or down, rescale the
 // non-fixed weights to the residual sum, and append all weights to the records.
 void gctl::grad_norm::UpdateWeights()
 {
    double free_cnt = 0;
    double mean_Lx = 0.0, mean_Gw = 0.0;
    // Averages are taken over the non-fixed tasks only. The fixed weights are
    // subtracted from the normal sum instead.
    resi_T_ = T_;
    for (size_t k = 0; k < fx_n_; k++)
    {
        if (!(fixed_wgts_[k] < 0.0))
        {
            resi_T_ -= fixed_wgts_[k];
            continue;
        }
        mean_Lx += Lx_[k];
        mean_Gw += Gw_[k];
        free_cnt += 1.0;
    }
    mean_Lx /= free_cnt;
    mean_Gw /= free_cnt;
    // L1 norm approach
    double free_sum = 0.0;
    for (size_t k = 0; k < fx_n_; k++)
    {
        if (!(fixed_wgts_[k] < 0.0)) continue;
        const double ratio = Lx_[k]/mean_Lx;
        const bool above_target = (Gw_[k] >= mean_Gw*pow(ratio, alpha_));
        if (above_target) wgts_[k] -= lamda_*Gdw_[k];
        else wgts_[k] += lamda_*Gdw_[k];
        // make sure the weights are positive
        wgts_[k] = std::max(wgts_[k], 1e-16);
        free_sum += wgts_[k];
    }
    for (size_t k = 0; k < fx_n_; k++)
    {
        if (fixed_wgts_[k] < 0.0)
        {
            wgts_[k] *= resi_T_/free_sum;
        }
        rcd_wgts_.push_back(wgts_[k]);
    }
 }
 // Write the current weights, the recorded loss values and the weighted losses to ss,
 // either as a multi-line report or on one line.
 void gctl::grad_norm::ShowStatistics(std::ostream &ss, bool one_line)
 {
    double weighted, total = 0.0;
    size_t k;
    if (!one_line)
    {
        // Multi-line report framed by two rulers.
        ss << "----------------------------\n" << "GradNorm's Progress\n" << "Tasks' weight: ";
        for (k = 0; k < fx_n_; ++k) ss << wgts_[k] << " | ";
        ss << "\n" << "Tasks' loss: ";
        for (k = 0; k < fx_n_; ++k) ss << rcd_fxs_[k] << " | ";
        ss << "\n" << "Weighted losses: ";
        for (k = 0; k < fx_n_; ++k)
        {
            weighted = wgts_[k]*rcd_fxs_[k];
            total += weighted;
            ss << weighted << " | ";
        }
        ss << total << " (total) |\n" << "----------------------------\n";
        return;
    }
    // Compact report on a single line.
    ss << "Wgts:";
    for (k = 0; k < fx_n_; ++k) ss << " " << wgts_[k];
    ss << ", Loss:";
    for (k = 0; k < fx_n_; ++k) ss << " " << rcd_fxs_[k];
    ss << ", WgtLoss:";
    for (k = 0; k < fx_n_; ++k)
    {
        weighted = wgts_[k]*rcd_fxs_[k];
        total += weighted;
        ss << " " << weighted;
    }
    ss << ", Total: " << total << "\n";
 }
 // Return the merged objective value and copy the merged gradients into g.
 // The accumulated value, the gradients and the loss counter are reset afterwards.
 // Throws std::runtime_error if the object is not initialized or if not all of the
 // loss functions were added since the last call.
 double gctl::grad_norm::GradNormLoss(array<double> &g)
 {
    // Check the initialization first: fx_n_ is only meaningful after InitGradNorm().
    if (!initialized_)
    {
        throw std::runtime_error("GradNorm is not initialized. From gctl::grad_norm::GradNormLoss()");
    }
    if (fx_c_ != fx_n_)
    {
        throw std::runtime_error("Not all loss functions evaluated. From gctl::grad_norm::GradNormLoss()");
    }
    double fx = multi_fx_;
    g = grad_;
    // Get ready for the next round of AddSingleLoss() calls.
    fx_c_ = 0;
    multi_fx_ = 0.0;
    grad_.assign_all(0.0);
    return fx;
 }
 void gctl::grad_norm::set_control_weight(double a)
 {
    alpha_ = a;
    return;
 }
 void gctl::grad_norm::set_normal_sum(double t)
 {
    T_ = t;
    return;
 }
 void gctl::grad_norm::set_weight_step(double l)
 {
    lamda_ = l;
    return;
 }
 void gctl::grad_norm::set_fixed_weight(int id, double wgt)
 {
    if (id < 0 || id >= fx_n_)
    {
        throw std::runtime_error("Invalid loss function's index. From gctl::grad_norm::set_fixed_weight(...)");
    }
    if (wgt <= 0.0 || wgt >= T_)
    {
        throw std::runtime_error("Invalid fixed weight value. From gctl::grad_norm::set_fixed_weight(...)");
    }
    fixed_wgts_[id] = wgt;
    wgts_[id] = wgt;
    resi_T_ = T_;
    double ac = 0.0;
    for (size_t i = 0; i < fx_n_; i++)
    {
        if (fixed_wgts_[i] > 0.0) resi_T_ -= fixed_wgts_[i];
        else ac += 1.0;
    }
    if (resi_T_ <= 0.0)
    {
        throw std::runtime_error("Invalid tasks' weight detected. From gctl::grad_norm::UpdateWeights()");
    }
    for (size_t i = 0; i < fx_n_; i++)
    {
        if (fixed_wgts_[i] < 0.0) wgts_[i] = resi_T_/ac;
    }
    for (size_t i = 0; i < fx_n_; i++)
    {
        rcd_wgts_[i] = wgts_[i];
    }
    return;
 }
 void gctl::grad_norm::set_initial_weights(const array<double> &w)
 {
    if (w.size() != fx_n_)
    {
        throw std::runtime_error("Invalid input array size. From gctl::grad_norm::set_initial_weights(...)");
    }
    double sum = 0.0;
    for (size_t i = 0; i < fx_n_; i++)
    {
        wgts_[i] = w[i];
        sum += wgts_[i];
    }
    for (size_t i = 0; i < fx_n_; i++)
    {
        wgts_[i] *= T_/sum;
        rcd_wgts_[i] = wgts_[i];
    }
    return;
 }
 // Copy all recorded weights into logs in the order they were recorded.
 void gctl::grad_norm::get_records(array<double> &logs)
 {
    const size_t total = rcd_wgts_.size();
    logs.resize(total);
    size_t k = 0;
    while (k < total)
    {
        logs[k] = rcd_wgts_[k];
        ++k;
    }
 }
 // Save the recorded weights to a text file: two comment lines as the header, then
 // one line of fx_n_ weights for every record.
 //   file - name of the output file, handed to open_outfile() together with ".txt"
 void gctl::grad_norm::save_records(std::string file)
 {
    std::ofstream ofile;
    open_outfile(ofile, file, ".txt");
    ofile << "# 'tw' for 'task weight'\n# ";
    for (size_t j = 0; j < fx_n_; j++)
    {
        ofile << "tw" << std::to_string(j) << " ";
    }
    ofile << "\n";
    // Use an unsigned index like the container does; the signed int used before was
    // compared against size_t and could not cover the full range of the records.
    for (size_t i = 0; i < rcd_wgts_.size(); i++)
    {
        ofile << rcd_wgts_[i] << " ";
        // Break the line after the last weight of a record.
        if ((i+1)%fx_n_ == 0) ofile << "\n";
    }
    ofile.close();
 }
--- a/lib/optimization/gradnorm.h
+++ b/lib/optimization/gradnorm.h
@ -0,0 +1,159 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_GRADNORM_H
 #define _GCTL_GRADNORM_H
 #include "gctl/core.h"
 #include "gctl/io.h"
 namespace gctl
 {
    /**
     * @brief Gradient normalized (balanced) multitask evaluation.
     * 
     * @note Reference: Zhao Chen et. al., 2018. GradNorm: Gradient normalization 
     * for adaptive loss balancing in deep multitask networks.
     * 
     * @note Call InitGradNorm() first. In every iteration call AddSingleLoss() once for 
     * each loss function and then GradNormLoss() to get the merged value. UpdateWeights() 
     * is presumably called once per iteration as well - confirm against the callers.
     */
    class grad_norm
    {
    private:
        bool initialized_; // set to true by InitGradNorm()
        size_t fx_n_, fx_c_; // total number of losses / number of losses added so far
        double resi_T_, T_; // normal sum left for the non-fixed weights / normal sum of all weights
        double lamda_, alpha_, multi_fx_; // weight step / control factor / merged objective value
        array<bool> fst_iter_; // true until the first value of a loss function is added
        array<double> wgts_; // current weights of the loss functions
        array<double> fx0_; // first value of every loss function
        array<double> Gw_, Gdw_, Lx_; // norm of weighted gradients / norm of gradients / loss relative to fx0_
        array<double> grad_; // merged (weighted) model gradients
        array<double> rcd_fxs_; // latest value of every loss function
        array<double> fixed_wgts_; // fixed weights; negative values mark non-fixed weights
        std::vector<double> rcd_wgts_; // recorded weights, fx_n_ values per record
    public:
        grad_norm();
        virtual ~grad_norm();
        /**
         * @brief Initiate the number of loss functions and size of the model gradients.
         * 
         * @note  This function must be called at first. It sets the normal sum to 1.0, 
         * sets all weights to 1/num and records them as the initial weights.
         * 
         * @param num Number of the total loss functions
         * @param grad_num Size of the model gradients
         */
        void InitGradNorm(size_t num, size_t grad_num);
        /**
         * @brief Add the value of a single loss function and the current model gradients.
         * 
         * @note The first value added for a loss function is kept as its reference value.
         * 
         * @param fx objective value
         * @param g model gradients
         * 
         * @return weighted value of the current loss function
         */
        double AddSingleLoss(double fx, const array<double> &g);
        /**
         * @brief Get the merged objective value and the model gradients.
         * 
         * @note All single loss functions must be added before calling this function, 
         * otherwise a std::runtime_error is thrown. The merged objective value and the 
         * model gradients will be reset after the calling.
         * 
         * @param g model gradients
         * 
         * @return objective value
         */
        double GradNormLoss(array<double> &g);
        /**
         * @brief Update weights for single loss functions using the GradNorm algorithm.
         * 
         * @note Fixed weights are not changed. The other weights are rescaled to sum up 
         * to the normal sum minus the fixed weights. All weights are appended to the records.
         */
        void UpdateWeights();
        /**
         * @brief Show statistics of the tasks' weight and loss function's value.
         * 
         * @param ss Output stream. The default is std::clog
         * @param one_line Print the statistics on one line. The default is false
         */
        void ShowStatistics(std::ostream &ss = std::clog, bool one_line = false);
        /**
         * @brief Set the control factor alpha. The default is 1.0
         * 
         * @param a Input alpha
         */
        void set_control_weight(double a);
        /**
         * @brief Set the normal sum of the weights. The default is 1.0.
         * 
         * @note InitGradNorm() resets the normal sum to 1.0, so call this function 
         * afterwards. The weights themselves are not rescaled by this function.
         * 
         * @param t Input sum
         */
        void set_normal_sum(double t);
        /**
         * @brief Set a learning rate of the weights. The default is 0.001
         * 
         * @param l Input learning rate
         */
        void set_weight_step(double l);
        /**
         * @brief Set the fixed weight.
         * 
         * @note A std::runtime_error is thrown if the index is out of range, or if the 
         * weight is not larger than zero and smaller than the normal sum. The non-fixed 
         * weights are reset to equal shares of the remaining sum.
         * 
         * @param id Index of the loss function
         * @param wgt weight of the loss function
         */
        void set_fixed_weight(int id, double wgt);
        /**
         * @brief Set the initial weights
         * 
         * @note The input weights are rescaled to sum up to the normal sum. A 
         * std::runtime_error is thrown if the size of the input does not match.
         * 
         * @param w Input weights
         */
        void set_initial_weights(const array<double> &w);
        /**
         * @brief Get the recorded weights. Size of the log equals the number of the loss functions times the number of records.
         * 
         * @note One record is stored by InitGradNorm() and one by every call of UpdateWeights().
         * 
         * @param logs Output log
         */
        void get_records(array<double> &logs);
        /**
         * @brief Save recorded weights to file.
         * 
         * @param file File name
         */
        void save_records(std::string file);
    };
 }
 #endif // _GCTL_GRADNORM_H
--- a/lib/optimization/lbfgs.cpp
+++ b/lib/optimization/lbfgs.cpp
--- a/lib/optimization/lbfgs.h
+++ b/lib/optimization/lbfgs.h
@ -0,0 +1,559 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_LBFGS_H
 #define _GCTL_LBFGS_H
 #include "gctl/core.h"
 #include "gctl/maths.h"
 #include "gctl/algorithm.h"
 #include "gctl_optimization_config.h"
 #ifdef GCTL_OPTIMIZATION_TOML
 #include "toml.hpp"
 #endif // GCTL_OPTIMIZATION_TOML
 #if defined _WINDOWS || __WIN32__
 #include "windows.h"
 #endif // _WINDOWS || __WIN32__
 namespace gctl
 {
    /**
     * @brief      Return value of the lbfgs() function. Roughly speaking, a negative value indicates an error.
     * 
     * @note       The non-negative codes count up from 0 and the error codes count up 
     * from -1024. Both follow the declaration order below.
     */
 	enum lbfgs_return_code
    {
        /** L-BFGS reaches convergence (value 0). Presumably raised by the test on lbfgs_para::epsilon - TODO confirm. */
        LBFGS_EPS_CONVERGENCE = 0,
        /** Value 1. Presumably raised by the test on lbfgs_para::delta - TODO confirm. */
        LBFGS_DELTA_CONVERGENCE,
        /** Value 2. Presumably raised by the test on lbfgs_para::residual - TODO confirm. */
        LBFGS_RESI_CONVERGENCE,
        /** Value 3. NOTE(review): the meaning is not documented here, see the implementation. */
        LBFGS_STOP, // 3
        /** The initial variables already minimize the objective function. */
        LBFGS_ALREADY_MINIMIZED, // 4
        /** Unknown error. */
        LBFGSERR_UNKNOWNERROR = -1024,
        /** Logic error. */
        LBFGSERR_LOGICERROR, //-1023
        /** Insufficient memory. */
        LBFGSERR_OUTOFMEMORY, //-1022
        /** The minimization process has been canceled. */
        LBFGSERR_CANCELED,
        /** Invalid number of variables specified. */
        LBFGSERR_INVALID_N,
        /** Invalid number of variables (for SSE) specified. */
        LBFGSERR_INVALID_N_SSE,
        /** The array x must be aligned to 16 (for SSE). */
        LBFGSERR_INVALID_X_SSE,
        /** Invalid parameter lbfgs_para::epsilon specified. */
        LBFGSERR_INVALID_EPSILON,
        /** Invalid parameter lbfgs_para::past specified. */
        LBFGSERR_INVALID_TESTPERIOD,
        /** Invalid parameter lbfgs_para::delta specified. */
        LBFGSERR_INVALID_DELTA,
        /** Invalid parameter lbfgs_para::linesearch specified. */
        LBFGSERR_INVALID_LINESEARCH,
        /** Invalid parameter lbfgs_para::min_step specified. */
        LBFGSERR_INVALID_MINSTEP,
        /** Invalid parameter lbfgs_para::max_step specified. */
        LBFGSERR_INVALID_MAXSTEP,
        /** Invalid parameter lbfgs_para::ftol specified. */
        LBFGSERR_INVALID_FTOL,
        /** Invalid parameter lbfgs_para::wolfe specified. */
        LBFGSERR_INVALID_WOLFE,
        /** Invalid parameter lbfgs_para::gtol specified. */
        LBFGSERR_INVALID_GTOL,
        /** Invalid parameter lbfgs_para::xtol specified. */
        LBFGSERR_INVALID_XTOL,
        /** Invalid parameter lbfgs_para::max_linesearch specified. */
        LBFGSERR_INVALID_MAXLINESEARCH,
        /** Invalid parameter lbfgs_para::orthantwise_c specified. */
        LBFGSERR_INVALID_ORTHANTWISE,
        /** Invalid parameter lbfgs_para::orthantwise_start specified. */
        LBFGSERR_INVALID_ORTHANTWISE_START,
        /** Invalid parameter lbfgs_para::orthantwise_end specified. */
        LBFGSERR_INVALID_ORTHANTWISE_END,
        /** The line-search step went out of the interval of uncertainty. */
        LBFGSERR_OUTOFINTERVAL,
        /** A logic error occurred; alternatively, the interval of uncertainty
            became too small. */
        LBFGSERR_INCORRECT_TMINMAX,
        /** A rounding error occurred; alternatively, no line-search step
            satisfies the sufficient decrease and curvature conditions. */
        LBFGSERR_ROUNDING_ERROR,
        /** The line-search step became smaller than lbfgs_para::min_step. */
        LBFGSERR_MINIMUMSTEP,
        /** The line-search step became larger than lbfgs_para::max_step. */
        LBFGSERR_MAXIMUMSTEP,
        /** The line-search routine reaches the maximum number of evaluations. */
        LBFGSERR_MAXIMUMLINESEARCH,
        /** The algorithm routine reaches the maximum number of iterations. */
        LBFGSERR_MAXIMUMITERATION,
        /** Relative width of the interval of uncertainty is at most
            lbfgs_para::xtol. */
        LBFGSERR_WIDTHTOOSMALL,
        /** A logic error (negative line-search step) occurred. */
        LBFGSERR_INVALIDPARAMETERS,
        /** The current search direction increases the objective function value. */
        LBFGSERR_INCREASEGRADIENT,
    };
    // Enumeration type: line search methods
    // 0 MoreThuente method
    // 1 Armijo condition method
    // 2 regular Wolfe condition method
    // 3 strong Wolfe condition method
    /**
     * @brief      Line search algorithms.
     * 
     * @note       Several names share one value: DEFAULT and MORETHUENTE are both 0, 
     * BACKTRACKING and BACKTRACKING_WOLFE are both 2.
     */
    enum line_search_type
    {
        /** The default algorithm (MoreThuente method). */
        LBFGS_LINESEARCH_DEFAULT = 0,
        /** MoreThuente method proposed by More and Thuente. */
        LBFGS_LINESEARCH_MORETHUENTE = 0,
        /**
         * Backtracking method with the Armijo condition.
         *  The backtracking method finds the step length such that it satisfies
         *  the sufficient decrease (Armijo) condition,
         *    - f(x + a * d) <= f(x) + lbfgs_para::ftol * a * g(x)^T d,
         *
         *  where x is the current point, d is the current search direction, and
         *  a is the step length.
         */
        LBFGS_LINESEARCH_BACKTRACKING_ARMIJO = 1,
        /** The backtracking method with the default (regular Wolfe) condition. */
        LBFGS_LINESEARCH_BACKTRACKING = 2,
        /**
         * Backtracking method with regular Wolfe condition.
         *  The backtracking method finds the step length such that it satisfies
         *  both the Armijo condition (LBFGS_LINESEARCH_BACKTRACKING_ARMIJO)
         *  and the curvature condition,
         *    - g(x + a * d)^T d >= lbfgs_para::wolfe * g(x)^T d,
         *
         *  where x is the current point, d is the current search direction, and
         *  a is the step length.
         */
        LBFGS_LINESEARCH_BACKTRACKING_WOLFE = 2,
        /**
         * Backtracking method with strong Wolfe condition.
         *  The backtracking method finds the step length such that it satisfies
         *  both the Armijo condition (LBFGS_LINESEARCH_BACKTRACKING_ARMIJO)
         *  and the following condition,
         *    - |g(x + a * d)^T d| <= lbfgs_para::wolfe * |g(x)^T d|,
         *
         *  where x is the current point, d is the current search direction, and
         *  a is the step length.
         */
        LBFGS_LINESEARCH_BACKTRACKING_STRONG_WOLFE = 3,
        /** NOTE(review): presumably the Armijo backtracking method with a quadratic 
            step update - not documented here, confirm in the implementation. */
        LBFGS_LINESEARCH_BACKTRACKING_ARMIJO_QUAD = 4,
        //LBFGS_LINESEARCH_BACKTRACKING_QUAD = 5,
        //LBFGS_LINESEARCH_BACKTRACKING_WOLFE_QUAD = 5,
        //LBFGS_LINESEARCH_BACKTRACKING_STRONG_WOLFE_QUAD = 6,
    };
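    // L-BFGS parameter type. There are many parameters; a brief summary follows:
    // m Number of previous sk and yk vectors stored by the L-BFGS algorithm. This value controls the memory used by the algorithm. The default is 6 (values smaller than 3 are not recommended). Larger values give a better approximation at a higher computational cost.
    // epsilon Termination accuracy of the iteration. The default is 1e-5
    // past Distance of the delta-based termination test (delta compares objective values of different iterations). It is the number of iterations between the two objective values used to compute delta. The default is 0,
    //      which means that delta is not used as a termination condition.
    // delta (f' - f) / f Ratio of the difference between the objective values of two iterations to the current objective value. It is only computed when past is not 0.
    // max_iterations Maximum number of iterations. 0 means iterating until a termination condition is met or an error occurs.
    // linesearch Line search method, defined by the enumeration type earlier in this file.
    // max_linesearch Maximum number of line search trials per iteration. The default is 40
    // min_step Minimum step length of the line search. The default is 1e-20
    // max_step Maximum step length of the line search. The default is 1e+20
    // ftol Accuracy of the line search. The default is 1e-4, valid range (0, 0.5).
    // wolfe Control parameter of the Wolfe line search. The default is 0.9; it should be greater than ftol and smaller than 1.0
    // gtol Control parameter of the line search. The default is 0.9; it should be greater than ftol and smaller than 1.0
    // xtol Floating-point precision. The default is 1e-16
    // orthantwise_c Coefficient of the L1 norm of the model parameters x. The default is 0.0, in which case the algorithm is in its L2 norm form. The algorithm becomes OWL-QN when this parameter is greater than 0
    // orthantwise_start Iteration index at which the computation of the L1 norm of the model parameters x starts
    // orthantwise_end Iteration index at which the computation of the L1 norm of the model parameters x ends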
    /**
     * L-BFGS optimization parameters.
     *  Call lbfgs_parameter_init() function to initialize parameters to the
     *  default values.
     */
    struct lbfgs_para
    {
        /**
         * The number of corrections to approximate the inverse hessian matrix.
         *  The L-BFGS routine stores the computation results of previous \ref m
         *  iterations to approximate the inverse hessian matrix of the current
         *  iteration. This parameter controls the size of the limited memories
         *  (corrections). The default value is \c 6. Values less than \c 3 are
         *  not recommended. Large values will result in excessive computing time.
         */
        int m;
        /**
         * Epsilon for convergence test.
         *  This parameter determines the accuracy with which the solution is to
         *  be found. A minimization terminates when
         *      ||g|| < \ref epsilon * max(1, ||x||),
         *  where ||.|| denotes the Euclidean (L2) norm. The default value is
         *  \c 1e-5.
         */
        double epsilon;
        /**
         * Distance for delta-based convergence test.
         *  This parameter determines the distance, in iterations, to compute
         *  the rate of decrease of the objective function. If the value of this
         *  parameter is zero, the library does not perform the delta-based
         *  convergence test. The default value is \c 0.
         */
        int past;
        /**
         * Delta for convergence test.
         *  This parameter determines the minimum rate of decrease of the
         *  objective function. The library stops iterations when the
         *  following condition is met:
         *      (f' - f) / f < \ref delta,
         *  where f' is the objective value of \ref past iterations ago, and f is
         *  the objective value of the current iteration.
         *  The default value is \c 1e-5.
         */
        double delta;
        /**
         * Residual for convergence test.
         * This parameter determines the accuracy with which the solution is to
         * be found. A minimization terminates when
         *      f(x) <= residual,
         * The default value is \c 1e-8.
         * 
         */
        double residual;
        /**
         * The maximum number of iterations.
         *  The lbfgs() function terminates an optimization process with
         *  ::LBFGSERR_MAXIMUMITERATION status code when the iteration count
         *  exceedes this parameter. Setting this parameter to zero continues an
         *  optimization process until a convergence or error. The default value
         *  is \c 0.
         */
        int             max_iterations;
        /**
         * The line search algorithm.
         *  This parameter specifies a line search algorithm to be used by the
         *  L-BFGS routine.
         */
        int             linesearch;
        /**
         * The maximum number of trials for the line search.
         *  This parameter controls the number of function and gradients evaluations
         *  per iteration for the line search routine. The default value is \c 40.
         */
        int             max_linesearch;
        /**
         * The minimum step of the line search routine.
         *  The default value is \c 1e-20. This value need not be modified unless
         *  the exponents are too large for the machine being used, or unless the
         *  problem is extremely badly scaled (in which case the exponents should
         *  be increased).
         */
        double min_step;
        /**
         * The maximum step of the line search.
         *  The default value is \c 1e+20. This value need not be modified unless
         *  the exponents are too large for the machine being used, or unless the
         *  problem is extremely badly scaled (in which case the exponents should
         *  be increased).
         */
        double max_step;
        /**
         * A parameter to control the accuracy of the line search routine.
         *  The default value is \c 1e-4. This parameter should be greater
         *  than zero and smaller than \c 0.5.
         */
        double ftol;
        /**
         * A coefficient for the Wolfe condition.
         *  This parameter is valid only when the backtracking line-search
         *  algorithm is used with the Wolfe condition,
         *  ::LBFGS_LINESEARCH_BACKTRACKING_STRONG_WOLFE or
         *  ::LBFGS_LINESEARCH_BACKTRACKING_WOLFE .
         *  The default value is \c 0.9. This parameter should be greater
         *  the \ref ftol parameter and smaller than \c 1.0.
         */
        double wolfe;
        /**
         * A parameter to control the accuracy of the line search routine.
         *  The default value is \c 0.9. If the function and gradient
         *  evaluations are inexpensive with respect to the cost of the
         *  iteration (which is sometimes the case when solving very large
         *  problems) it may be advantageous to set this parameter to a small
         *  value. A typical small value is \c 0.1. This parameter shuold be
         *  greater than the \ref ftol parameter (\c 1e-4) and smaller than
         *  \c 1.0.
         */
        double gtol;
        /**
         * The machine precision for floating-point values.
         *  This parameter must be a positive value set by a client program to
         *  estimate the machine precision. The line search routine will terminate
         *  with the status code (::LBFGSERR_ROUNDING_ERROR) if the relative width
         *  of the interval of uncertainty is less than this parameter.
         */
        double xtol;
        /**
         * Coeefficient for the L1 norm of variables.
         *  This parameter should be set to zero for standard minimization
         *  problems. Setting this parameter to a positive value activates
         *  Orthant-Wise Limited-memory Quasi-Newton (OWL-QN) method, which
         *  minimizes the objective function F(x) combined with the L1 norm |x|
         *  of the variables, {F(x) + C |x|}. This parameter is the coeefficient
         *  for the |x|, i.e., C. As the L1 norm |x| is not differentiable at
         *  zero, the library modifies function and gradient evaluations from
         *  a client program suitably; a client program thus have only to return
         *  the function value F(x) and gradients G(x) as usual. The default value
         *  is zero.
         */
        double orthantwise_c;
        /**
         * Start index for computing L1 norm of the variables.
         *  This parameter is valid only for OWL-QN method
         *  (i.e., \ref orthantwise_c != 0). This parameter b (0 <= b < N)
         *  specifies the index number from which the library computes the
         *  L1 norm of the variables x,
         *      |x| := |x_{b}| + |x_{b+1}| + ... + |x_{N}| .
         *  In other words, variables x_1, ..., x_{b-1} are not used for
         *  computing the L1 norm. Setting b (0 < b < N), one can protect
         *  variables, x_1, ..., x_{b-1} (e.g., a bias term of logistic
         *  regression) from being regularized. The default value is zero.
         */
        int             orthantwise_start;
        /**
         * End index for computing L1 norm of the variables.
         *  This parameter is valid only for OWL-QN method
         *  (i.e., \ref orthantwise_c != 0). This parameter e (0 < e <= N)
         *  specifies the index number at which the library stops computing the
         *  L1 norm of the variables x,
         */
        int             orthantwise_end;
    };
    /**
     * @brief Abstract base class wrapping the L-BFGS optimization routines.
     *
     * A client derives from this class and implements LBFGS_Evaluate() (pure virtual).
     * LBFGS_Precondition() and LBFGS_Progress() are virtual but not pure, so overriding
     * them is optional. The optimization is started through LBFGS_Minimize() or
     * LBFGS_MinimizePreconditioned(); the core routines themselves are private.
     */
    class lbfgs_solver
    {
    private:
        lbfgs_para lbfgs_param_; ///< L-BFGS algorithm parameters
 		bool lbfgs_silent_; ///< Flag controlling the display of runtime information (see lbfgs_silent(); exact polarity is defined in the implementation)
        // The algorithm routines are private and cannot be called directly; they are
        // invoked through the Minimize functions.
        // Below is the main L-BFGS routine. Brief notes on its arguments:
        // x      The model parameters. The routine works on this array in place, so no
        //        result is returned separately: on entry it holds the initial model and
        //        on exit it holds the optimization result.
        // ptr_fx Receives the objective function value, which makes it convenient to
        //        monitor convergence from outside the routine.
        // retval Return code. Zero means no error; a non-zero value corresponds to one of
        //        the lbfgs_return_code enumerators, and lbfgs_error_str() uses it to
        //        print the matching message.
        /**
         * Start a L-BFGS optimization.
         *
         *  @param  x           The array of variables. A client program can set
         *                      initial values for the optimization and receive the
         *                      optimization result through this array.
         *  @param  ptr_fx      Receives the final value of the objective function
         *                      for the variables.
         *  @param  ss          Output stream object.
         *  @retval             The status code. This function returns zero if the
         *                      minimization process terminates without an error. A
         *                      non-zero value indicates an error.
         */
        lbfgs_return_code lbfgs(array<double> &x, double &ptr_fx, std::ostream &ss);
        // Variant of lbfgs() with the same parameter list.
        // NOTE(review): presumably this is the routine that calls LBFGS_Precondition() -
        // confirm against the implementation file.
        lbfgs_return_code lbfgs_preconditioned(array<double> &x, double &ptr_fx, std::ostream &ss);
        // Line-search routines. Internal private functions; not to be used directly.
        lbfgs_return_code line_search_backtracking(int n, gctl::array<double> &x, double *f, gctl::array<double> &g, gctl::array<double> &s, 
            double *stp, const gctl::array<double> &xp, const gctl::array<double> &gp, gctl::array<double> &wp, int &ls);
        lbfgs_return_code line_search_backtracking_quad(int n, gctl::array<double> &x, double *f, gctl::array<double> &g, gctl::array<double> &s, 
            double *stp, const gctl::array<double> &xp, const gctl::array<double> &gp, gctl::array<double> &wp, int &ls);
        lbfgs_return_code line_search_backtracking_owlqn(int n, gctl::array<double> &x, double *f, gctl::array<double> &g, gctl::array<double> &s, 
            double *stp, const gctl::array<double> &xp, const gctl::array<double> &gp, gctl::array<double> &wp, int &ls);
        lbfgs_return_code line_search_morethuente(int n, gctl::array<double> &x, double *f, gctl::array<double> &g, gctl::array<double> &s, 
            double *stp, const gctl::array<double> &xp, const gctl::array<double> &gp, gctl::array<double> &wa, int &ls);
        // Display information about a return code of the lbfgs routines (mainly error messages).
        // ss defaults to std::clog and err_throw defaults to false.
        void lbfgs_error_str(lbfgs_return_code err_code, std::ostream &ss = std::clog, bool err_throw =  false);
    public:
        lbfgs_solver();
        virtual ~lbfgs_solver();
        /**
         * @brief Do not display runtime information; only throw runtime errors.
         * 
         */
        void lbfgs_silent();
        /**
         * @brief Set the algorithm parameters.
         * 
         * @param in_param Parameter object
         */
        void set_lbfgs_para(const lbfgs_para &in_param);
 #ifdef GCTL_OPTIMIZATION_TOML
        /**
         * @brief Set the algorithm parameters. Only declared when GCTL_OPTIMIZATION_TOML is defined.
         * 
         * @param toml_data TOML data object 
         */
        void set_lbfgs_para(const toml::value &toml_data);
 #endif // GCTL_OPTIMIZATION_TOML
        /**
         * @brief Return a parameter object in which every field holds its default value.
         * 
         * @return lbfgs_para 
         */
 		lbfgs_para default_lbfgs_para();
        /**
         * @brief Display the parameters currently in use.
         * 
         * @param ss Output stream (defaults to std::clog)
         */
        void show_lbfgs_para(std::ostream &ss = std::clog);
        // Interface for computing the objective function and its gradient:
        // x      current values of the model parameters
        // g      gradient corresponding to the current model parameters
        // retval objective function value for the current model parameters
        /**
         * Callback interface to provide objective function and gradient evaluations.
         *
         *  The lbfgs() function calls this function to obtain the values of the objective
         *  function and its gradients when needed. A client program must implement
         *  this function to evaluate the values of the objective function and its
         *  gradients, given current values of variables.
         *  
         *  @param  x           The current values of variables.
         *  @param  g           The gradient vector. The callback function must compute
         *                      the gradient values for the current variables.
         *  @retval double      The value of the objective function for the current
         *                      variables.
         */
        virtual double LBFGS_Evaluate(const array<double> &x, array<double> &g) = 0;
        /**
         * Callback interface to implement the preconditioning process.
         *
         *  The lbfgs() function calls this function for each iteration. Implementing
         *  this function, a client program can perform the preconditioning process.
         *  Unlike LBFGS_Evaluate(), this function is not pure virtual.
         *
         *  @param  x           The current values of variables.
         *  @param  g           The current gradient values of variables.
         *  @param  d           The current values of search directions.
         *  @param  d_pre       The values of search directions being preconditioned. 
         *                      The callback function must compute these values.
         */
        virtual void LBFGS_Precondition(const array<double> &x, const array<double> &g, const array<double> &d, array<double> &d_pre);
        // Interface of the progress function:
        // x      current values of the model parameters
        // g      gradient corresponding to the current model parameters
        // fx     value of the objective function
        // k      iteration count
        // ls     number of line-search evaluations used in this iteration
        // retval return 0 to let lbfgs() continue; any other value terminates it
        /**
         * Callback interface to receive the progress of the optimization process.
         *
         *  The lbfgs() function calls this function for each iteration. Implementing
         *  this function, a client program can store or display the current progress
         *  of the optimization process.
         *
         *  @param  x           The current values of variables.
         *  @param  g           The current gradient values of variables.
         *  @param  fx          The current value of the objective function.
         *  @param  converge    Current value of the convergence test.
         *  @param  rate        Current value of the delta-based convergence test.
         *  @param  param       The parameter set (passed by value); added by this library so
         *                      that the parameters can be used to monitor the iteration process.
         *  @param  k           The iteration count.
         *  @param  ls          The number of evaluations called for this iteration.
         *  @param  ss          Output stream object.
         *  @retval int         Zero to continue the optimization process. Returning a
         *                      non-zero value will cancel the optimization process.
         */
        virtual int LBFGS_Progress(const array<double> &x, const array<double> &g, const double fx, 
            const double converge, const double rate, const lbfgs_para param, int k, int ls, std::ostream &ss);
        /**
         * @brief Run the minimization process.
         * 
         * @param m Initial model; the optimization result is stored in the same array
         * @param ss Output stream for runtime information
         * @param err_throw Only throw errors
         * @return double Final value of the objective function
         */
        double LBFGS_Minimize(array<double> &m, std::ostream &ss = std::clog, bool err_throw = false);
        /**
         * @brief Run the minimization process (preconditioned variant).
         * 
         * @param m Initial model; the optimization result is stored in the same array
         * @param ss Output stream for runtime information
         * @param err_throw Only throw errors
         * @return double Final value of the objective function
         */
        double LBFGS_MinimizePreconditioned(array<double> &m, std::ostream &ss = std::clog, bool err_throw = false);
    };
 }
 #endif // _GCTL_LBFGS_H
--- a/lib/optimization/lcg.cpp
+++ b/lib/optimization/lcg.cpp
--- a/lib/optimization/lcg.h
+++ b/lib/optimization/lcg.h
@ -0,0 +1,387 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_LCG_H
 #define _GCTL_LCG_H
 #include "gctl/core.h"
 #include "gctl/maths.h"
 #include "gctl/algorithm.h"
 #include "gctl_optimization_config.h"
 #ifdef GCTL_OPTIMIZATION_TOML
 #include "toml.hpp"
 #endif // GCTL_OPTIMIZATION_TOML
 #if defined _WINDOWS || __WIN32__
 #include "windows.h"
 #endif // _WINDOWS || __WIN32__
 namespace gctl
 {
 	/**
 	 * @brief      Solver selectors understood by the lcg_solver class.
 	 *
 	 * The numeric values are written out explicitly; they equal the values the
 	 * enumerators would receive from implicit numbering starting at zero.
 	 */
 	enum lcg_solver_type
 	{
 		LCG_CG        = 0, ///< Conjugate gradient method.
 		LCG_PCG       = 1, ///< Preconditioned conjugate gradient method.
 		LCG_CGS       = 2, ///< Conjugate gradient squared method.
 		LCG_BICGSTAB  = 3, ///< Biconjugate gradient method (BICGSTAB).
 		LCG_BICGSTAB2 = 4, ///< Biconjugate gradient method with restart (BICGSTAB2).
 		/// Conjugate gradient method with projected gradient for inequality constraints.
 		/// This algorithm comes without non-monotonic linear search for the step length.
 		LCG_PG        = 5,
 		/// Conjugate gradient method with spectral projected gradient for inequality constraints.
 		/// This algorithm comes with non-monotonic linear search for the step length.
 		LCG_SPG       = 6,
 	};
 	/**
 	 * @brief      Status codes reported by the lcg_solver routines.
 	 *
 	 * Non-negative values describe a normal termination; negative values
 	 * (starting at -1024 and counting upwards) describe errors. Every value is
 	 * spelled out here and matches what implicit numbering would assign.
 	 */
 	enum lcg_return_code
 	{
 		/// The solver function terminated successfully.
 		LCG_SUCCESS = 0,
 		/// The iteration reached convergence (same value as LCG_SUCCESS).
 		LCG_CONVERGENCE = 0,
 		/// The iteration is stopped by the monitoring function.
 		LCG_STOP = 1,
 		/// The initial solution is already optimized.
 		LCG_ALREADY_OPTIMIZIED = 2,

 		// A negative number means an error
 		/// Unknown error.
 		LCG_UNKNOWN_ERROR = -1024,
 		/// The variable size is negative
 		LCG_INVILAD_VARIABLE_SIZE = -1023,
 		/// The maximal iteration times is negative.
 		LCG_INVILAD_MAX_ITERATIONS = -1022,
 		/// The epsilon is negative.
 		LCG_INVILAD_EPSILON = -1021,
 		/// The restart epsilon is negative.
 		LCG_INVILAD_RESTART_EPSILON = -1020,
 		/// Iteration reached maximal limit.
 		LCG_REACHED_MAX_ITERATIONS = -1019,
 		/// Null precondition matrix.
 		LCG_NULL_PRECONDITION_MATRIX = -1018,
 		/// Nan value.
 		LCG_NAN_VALUE = -1017,
 		/// Invalid pointer.
 		LCG_INVALID_POINTER = -1016,
 		/// Invalid range for lambda.
 		LCG_INVALID_LAMBDA = -1015,
 		/// Invalid range for sigma.
 		LCG_INVALID_SIGMA = -1014,
 		/// Invalid range for beta.
 		LCG_INVALID_BETA = -1013,
 		/// Invalid range for maxi_m.
 		LCG_INVALID_MAXIM = -1012,
 		/// Sizes of m and B do not match
 		LCG_SIZE_NOT_MATCH = -1011,
 	};
 	/**
 	 * @brief    Verbosity levels of the LCG algorithms.
 	 *
 	 * Values are listed explicitly and are identical to implicit numbering from zero.
 	 */
 	enum lcg_message_type
 	{
 		/// throw error only
 		LCG_THROW = 0,
 		/// display error only
 		LCG_ERROR = 1,
 		/// display info for every solution
 		LCG_SOLUTION = 2,
 		/// display info for every iteration
 		LCG_ITERATION = 3,
 	};
 	/**
 	 * @brief      Parameters of the conjugate gradient methods.
 	 *
 	 * NOTE(review): the members are plain data in a fixed order; any positional
 	 * (brace) initialization of this struct elsewhere depends on that order, so
 	 * do not reorder the fields without checking such initializers.
 	 */
 	struct lcg_para
 	{
 		/**
 		 * Maximal number of iterations. The process will continue until convergence is met
 		 * if this option is set to zero (default).
 		*/
 		int max_iterations;
 		/**
 		 * Epsilon for the convergence test.
 		 * This parameter determines the accuracy with which the solution is to be 
 		 * found. A minimization terminates when ||g||/max(||g0||, 1.0) <= epsilon or 
 		 * sqrt(||g||)/N <= epsilon for the lcg_solver() function, where ||.|| denotes 
 		 * the Euclidean (L2) norm. The default value of epsilon is 1e-8.
 		*/
 		double epsilon;
 		/**
 		 * Whether to use the absolute mean difference (AMD) of |Ax - B| to evaluate the process. 
 		 * The flag is stored as an int. The default value is false, which means the gradient-based 
 		 * evaluation is used. The AMD-based evaluation is used if this variable is set to true. 
 		 * This parameter only applies to the non-constrained methods.
 		 */
 		int abs_diff;
 		/**
 		 * Restart epsilon for the LCG_BICGSTAB2 algorithm. The default value is 1e-6
 		 */
 		double restart_epsilon;
 		/**
 		 * Initial step length for the projected gradient method. The default is 1.0
 		 */
 		double step;
 		/**
 		 * Multiplier for updating solutions with the spectral projected gradient method. The range of
 		 * this variable is (0, 1). The default is given as 0.95
 		 */
 		double sigma;
 		/**
 		 * Descending ratio for conducting the non-monotonic linear search. The range of
 		 * this variable is (0, 1). The default is given as 0.9
 		 */
 		double beta;
 		/**
 		 * The maximal number of recorded objective values for the SPG method. The method uses the 
 		 * objective values from the most recent maxi_m iterations to perform the non-monotonic linear search.
 		 * The default value is 10.
 		 */
 		int maxi_m;
 	};
 	/**
 	 * @brief This abstract class implements conjugate gradient algorithms for solving 
 	 * a linear system like Ax = B where A is a N*N matrix. As the actual quantity 
 	 * needed is the product 'Ax', the kernel matrix 'A' is not declared within 
 	 * the class definition. Instead, a pure virtual function is declared as the 
 	 * callback interface for calculating the product 'Ax': 'void LCG_Ax(const 
 	 * array<double> &x, array<double> &ax)'. The virtual function "int LCG_Progress(const 
 	 * array<double> &m, const double converge, const lcg_para &param, size_t t, 
 	 * std::ostream &ss)" can be overridden for customized convergence tests.
 	 */
 	class lcg_solver
 	{
 	private:
 		lcg_para lcg_param_; ///< Parameters in use (see set_lcg_para()).
 		size_t lcg_inter_; ///< Report interval (see set_lcg_report_interval()).
 		lcg_message_type lcg_msg_; ///< Message type (see set_lcg_message()).
 		// Work arrays. They are kept as class members, which is more suitable for
 		// repeated use of the solver.
 		array<double> zk, gk, dk, Adk;
 		array<double> rk, r0_T, pk, vk;
    	array<double> Apx, uk, qk, qk_m, wk;
 		array<double> m_new, gk_new;
    	array<double> sk, yk;
 		/**
 		 * @brief Display info of a given return code. This is a private function
 		 * and can only be called by other class functions.
 		 * 
 		 * @param err_code Input return code
 		 * @param ss Output stream of runtime info.
 		 */
 		void lcg_error_str(lcg_return_code err_code, std::ostream &ss);
 	public:
 		lcg_solver(); ///< default constructor
 		virtual ~lcg_solver(); ///< default destructor
 		/**
 		 * @brief Callback interface for calculating the product of 'A' multiplied by an arbitrary vector 'x'.
 		 * Pure virtual: every derived class must implement it.
 		 * 
 		 * @param x Multiplier
 		 * @param ax Product of Ax
 		 */
 		virtual void LCG_Ax(const array<double> &x, array<double> &ax) = 0;
 		/**
 		 * @brief Callback interface for calculating the product of 'M' multiplied by an arbitrary vector 'x',
 		 * in which 'M' is the inverse of the pre-conditioning matrix. This function must be overridden for the
 		 * LCG_PCG algorithm.
 		 * 
 		 * @param x Multiplier
 		 * @param mx Product of Mx
 		 */
 		virtual void LCG_Mx(const array<double> &x, array<double> &mx);
 		/**
 		 * @brief Utility function for monitoring the solving process.
 		 * 
 		 * @param m Current solution
 		 * @param converge Current convergence
 		 * @param param Employed parameters
 		 * @param t Current iteration count
 		 * @param ss Output stream of runtime info.
 		 * @return Quit the solver if a non-zero value is returned.
 		 */
 		virtual int LCG_Progress(const array<double> &m, const double converge, const lcg_para &param, size_t t, std::ostream &ss);
 		/**
 		 * @brief Set the lcg message object
 		 * 
 		 * @param msg Input message type.
 		 */
 		void set_lcg_message(lcg_message_type msg);
 		/**
 		 * @brief Set the lcg report interval
 		 * 
 		 * @param inter Input report interval.
 		 */
 		void set_lcg_report_interval(size_t inter);
 		/**
 		 * @brief Set the lcg para object
 		 * 
 		 * @param param Input lcg parameters.
 		 */
 		void set_lcg_para(const lcg_para &param);
 		/**
 		 * @brief Return a lcg_para object with default values
 		 * 
 		 * @return lcg_para
 		 */
 		lcg_para default_lcg_para();
 #ifdef GCTL_OPTIMIZATION_TOML
 		/**
 		 * @brief Set parameters of the conjugate gradient algorithms using a toml file. 
 		 * All parameter options must be listed under a top-level table 'lcg'. Available options 
 		 * under the 'lcg' table are as declared in the lcg_para structure.
 		 * 
 		 * @param filename Name of the input toml file
 		 */
 		void set_lcg_para(std::string filename);
 		/**
 		 * @brief Set parameters of the conjugate gradient algorithms using a toml::value object. 
 		 * All parameter options must be listed under a top-level table 'lcg'. Available options 
 		 * under the 'lcg' table are as declared in the lcg_para structure.
 		 * 
 		 * @param toml_data Input toml data
 		 */
        void set_lcg_para(const toml::value &toml_data);
 #endif // GCTL_OPTIMIZATION_TOML
 		/**
 		 * @brief The callback interface for all CG algorithms. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param b Right hand term of the linear system.
 		 * @param solver_id Selected solver type (defaults to LCG_CG). 
 		 * @param ss Output stream of runtime info.
 		 */
 		void LCG_Minimize(array<double> &m, const array<double> &b, lcg_solver_type solver_id = LCG_CG, std::ostream &ss = std::clog);
 		/**
 		 * @brief The callback interface for all constrained CG algorithms. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param b Right hand term of the linear system.
 		 * @param low Lower bound of acceptable solutions.
 		 * @param hig Higher bound of acceptable solutions.
 		 * @param solver_id Selected solver type (defaults to LCG_PG).
 		 * @param ss Output stream of runtime info.
 		 */
 		void LCG_MinimizeConstrained(array<double> &m, const array<double> &b, const array<double> &low, const array<double> &hig, lcg_solver_type solver_id = LCG_PG, std::ostream &ss = std::clog);
 		/**
 		 * @brief The standalone callback interface for the CG algorithm. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param B Right hand term of the linear system.
 		 * @param ss Output stream of runtime info.
 		 */
 		void lcg(array<double> &m, const array<double> &B, std::ostream &ss = std::clog);
 		/**
 		 * @brief The standalone callback interface for the PCG algorithm. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param B Right hand term of the linear system.
 		 * @param ss Output stream of runtime info.
 		 */
 		void lpcg(array<double> &m, const array<double> &B, std::ostream &ss = std::clog);
 		/**
 		 * @brief The standalone callback interface for the CGS algorithm. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param B Right hand term of the linear system.
 		 * @param ss Output stream of runtime info.
 		 */
 		void lcgs(array<double> &m, const array<double> &B, std::ostream &ss = std::clog);
 		/**
 		 * @brief The standalone callback interface for the BICGSTAB algorithm. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param B Right hand term of the linear system.
 		 * @param ss Output stream of runtime info.
 		 */
 		void lbicgstab(array<double> &m, const array<double> &B, std::ostream &ss = std::clog);
 		/**
 		 * @brief The standalone callback interface for the BICGSTAB2 algorithm. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param B Right hand term of the linear system.
 		 * @param ss Output stream of runtime info.
 		 */
 		void lbicgstab2(array<double> &m, const array<double> &B, std::ostream &ss = std::clog);
 		/**
 		 * @brief The standalone callback interface for the PG algorithm. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param B Right hand term of the linear system.
 		 * @param low Lower bound of acceptable solutions.
 		 * @param hig Higher bound of acceptable solutions.
 		 * @param ss Output stream of runtime info.
 		 */
 		void lpg(array<double> &m, const array<double> &B, const array<double> &low, const array<double> &hig, std::ostream &ss = std::clog);
 		/**
 		 * @brief The standalone callback interface for the SPG algorithm. Set message type to LCG_THROW to suppress all info outputs.
 		 * 
 		 * @param m Initial/Input solution.
 		 * @param B Right hand term of the linear system.
 		 * @param low Lower bound of acceptable solutions.
 		 * @param hig Higher bound of acceptable solutions.
 		 * @param ss Output stream of runtime info.
 		 */
 		void lspg(array<double> &m, const array<double> &B, const array<double> &low, const array<double> &hig, std::ostream &ss = std::clog);
 	};
 }
 #endif // _GCTL_LCG_H
--- a/lib/optimization/lgd.cpp
+++ b/lib/optimization/lgd.cpp
@ -0,0 +1,505 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "lgd.h"
 /**
 * Default parameters for the Lévy-Gradient Descent (L-GD) method.
 *
 * The initializer is positional and follows the member order of gctl::lgd_para:
 * flight_times = 1000, batch = 0, epsilon = 1e-5, stddev_v = 1.0, beta = 1.5,
 * alpha = 0.01, sigma = 1e-8, lambda = -1.0.
 */
 static const gctl::lgd_para lgd_defparam = {1000, 0, 1e-5, 1.0, 1.5, 0.01, 1e-8, -1.0};
 /**
  * Build a solver that starts from the default L-GD parameters. Progress is
  * reported on every flight (interval 1), and silent mode, range constraints,
  * per-variable scaling and trace recording are all switched off.
  */
 gctl::lgd_solver::lgd_solver()
 {
    lgd_param_ = lgd_defparam;
    // Counters and the report interval.
    lgd_inter_ = 1;
    lgd_ques_num_ = 0;
    lgd_trace_times_ = 0;
    // Optional features are disabled until explicitly requested.
    lgd_silent_ = false;
    lgd_has_range_ = false;
    lgd_has_alpha_ = false;
    lgd_save_trace_ = false;
 }
 /// The destructor has nothing to release explicitly.
 gctl::lgd_solver::~lgd_solver() {}
 /**
  * Default progress monitor: prints a one-line status to std::clog.
  *
  * Nothing is printed in silent mode. Otherwise the status line is written when
  * the mean objective has dropped to param.epsilon or below (with a positive
  * epsilon), or when curr_t is a multiple of the (positive) report interval.
  *
  * @return Always 0, so the default monitor never stops the iteration.
  */
 int gctl::lgd_solver::LGD_Progress(const int curr_t, const double curr_fx, const double mean_fx, const double best_fx, const lgd_para &param)
 {
    if (!lgd_silent_)
    {
        const bool mean_converged = param.epsilon > 0.0 && mean_fx <= param.epsilon;
        // The modulo is only evaluated for a positive interval.
        const bool on_interval = lgd_inter_ > 0 && curr_t%lgd_inter_ == 0;
        if (mean_converged || on_interval)
        {
            std::clog << GCTL_CLEARLINE << "\rF(x) = " << curr_fx << ", Mean F(x) = " << mean_fx <<  ", Best F(x) = " << best_fx << ", Times = " << curr_t;
        }
    }
    return 0;
 }
 /// Switch the solver to silent mode (see LGD_Progress and LGD_Minimize).
 void gctl::lgd_solver::lgd_silent()
 {
    lgd_silent_ = true;
 }
 /// Set how often (in flights) the default progress monitor prints; non-positive values disable interval printing.
 void gctl::lgd_solver::set_lgd_report_interval(int inter)
 {
    lgd_inter_ = inter;
 }
 /// Replace the solver's parameters with a copy of in_param; values are validated later, when the solver runs.
 void gctl::lgd_solver::set_lgd_para(const lgd_para &in_param)
 {
    lgd_param_ = in_param;
 }
 #ifdef GCTL_OPTIMIZATION_TOML
 /**
  * Parse the TOML file `filename` and load the L-GD parameters from it.
  */
 void gctl::lgd_solver::set_lgd_para(std::string filename)
 {
    const toml::value parsed = toml::parse(filename);
    set_lgd_para(parsed);
 }
 /**
  * Load the L-GD parameters from the "lgd" table of a parsed TOML document.
  *
  * The parameters are first reset to the defaults; every key present in the
  * table then overrides its default. A document without an "lgd" table leaves
  * the solver with the defaults.
  */
 void gctl::lgd_solver::set_lgd_para(const toml::value &toml_data)
 {
    lgd_param_ = lgd_defparam;
    const std::string table_name = "lgd";
    if (!toml_data.contains(table_name)) return;
    const toml::value &section = toml_data.at(table_name);
    // Integer-valued options.
    if (section.contains("flight_times")) lgd_param_.flight_times = toml::find<int>(section, "flight_times");
    if (section.contains("batch"))        lgd_param_.batch = toml::find<int>(section, "batch");
    // Floating-point options.
    if (section.contains("epsilon"))      lgd_param_.epsilon = toml::find<double>(section, "epsilon");
    if (section.contains("stddev_v"))     lgd_param_.stddev_v = toml::find<double>(section, "stddev_v");
    if (section.contains("beta"))         lgd_param_.beta = toml::find<double>(section, "beta");
    if (section.contains("alpha"))        lgd_param_.alpha = toml::find<double>(section, "alpha");
    if (section.contains("sigma"))        lgd_param_.sigma = toml::find<double>(section, "sigma");
    if (section.contains("lambda"))       lgd_param_.lambda = toml::find<double>(section, "lambda");
 }
 #endif // GCTL_OPTIMIZATION_TOML
 /// Turn on recording of the flight trace so that it can be written out with save_lgd_trace().
 void gctl::lgd_solver::set_lgd_record_trace()
 {
    lgd_save_trace_ = true;
 }
 void gctl::lgd_solver::show_solver()
 {
 	std::clog << "Solver's Setup Panel\n";
 	std::clog << "-----------------------------\n";
 	std::clog << "Solver: LGD\n";
 	std::clog << "Flights = " << lgd_param_.flight_times << ", Batch = " << lgd_param_.batch << ", Epsilon = " << lgd_param_.epsilon  << ", Lambda = " << lgd_param_.lambda << "\n";
 	std::clog << "STD(v) = " << lgd_param_.stddev_v << ", Beta = " << lgd_param_.beta << ", Alpha = " << lgd_param_.alpha << ", Sigma = " << lgd_param_.sigma << "\n";
 	std::clog << "=============================\n";
    return;
 }
 /**
  * Write the recorded flight trace to a text file, one recorded solution per row.
  *
  * When no solution has been recorded, a warning is raised through
  * GCTL_ShowWhatError and no file is written. The file is opened through
  * open_outfile() with the ".txt" extension argument.
  *
  * @param trace_file Name of the output file handed to open_outfile().
  */
 void gctl::lgd_solver::save_lgd_trace(std::string trace_file)
 {
    if (lgd_trace_times_ == 0)
    {
        GCTL_ShowWhatError("[gctl::lgd_solver] No trace is recorded.", GCTL_WARNING_ERROR, 0, 0, 0);
        return;
    }
    std::ofstream ofile;
    open_outfile(ofile, trace_file, ".txt");
    // The trace is stored flat; the row length is recovered from the number of recorded rows.
    const int m_size = lgd_trace_.size()/lgd_trace_times_;
    ofile << "# L-GD flight traces.\n"
          << "# Each row represents an accepted solution.\n"
          << "# Model size: " << m_size << "\n"
          << "# Accepted solutions: " << lgd_trace_times_ << "\n";
    for (size_t row = 0; row < lgd_trace_times_; row++)
    {
        const size_t row_start = row*m_size;
        for (size_t col = 0; col < m_size; col++)
        {
            ofile << lgd_trace_[row_start + col] << " ";
        }
        ofile << "\n";
    }
    ofile.close();
 }
 /**
  * Report the meaning of a solver return code.
  *
  * With err_throw == false the message is written to `ss`, wrapped in a
  * coloured "Success"/"Fail" prefix and followed by a line break. With
  * err_throw == true a negative code is raised as a std::string exception,
  * while a non-negative code is written to `ss` as the bare message (no
  * prefix, no line break).
  *
  * @param err_code  Return code to describe; values >= 0 count as success.
  * @param ss        Stream that receives the message.
  * @param err_throw Throw instead of printing when the code is negative.
  */
 void gctl::lgd_solver::lgd_error_str(lgd_return_code err_code, std::ostream &ss, bool err_throw)
 {
    const bool succeeded = (err_code >= 0);
    // Coloured status prefix (reporting mode only).
    if (!err_throw)
    {
 #if defined _WINDOWS || __WIN32__
        if (succeeded)
        {
            SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), FOREGROUND_INTENSITY | FOREGROUND_GREEN);
            ss << "Success! ";
        }
        else
        {
            SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), FOREGROUND_INTENSITY | FOREGROUND_RED);
            ss << "Fail! ";
        }
 #else
        ss << (succeeded ? "\033[1m\033[32mLGD Success! " : "\033[1m\033[31mLGD Fail! ");
 #endif
    }
    // Translate the code into its human-readable description.
    const char *text = "Unknown error.";
    switch (err_code)
    {
        case LGD_CONVERGENCE:
            text = "The iteration has reached convergence.";
            break;
        case LGD_STOP:
            text = "The iteration is stopped by the progress monitoring function.";
            break;
        case LGD_REACHED_MAX_ITERATIONS:
            text = "The maximal flight times has been reached.";
            break;
        case LGD_INVALID_SOLUTION_SIZE:
            text = "Invalid solution size.";
            break;
        case LGD_INVALID_MAX_ITERATIONS:
            text = "Invalid flight times.";
            break;
        case LGD_INVALID_EPSILON:
            text = "Invalid epsilon value.";
            break;
        case LGD_INVALID_STDV:
            text = "Invalid STD value for generating the levy distribution.";
            break;
        case LGD_INVALID_BETA:
            text = "Invalid beta value.";
            break;
        case LGD_INVALID_ALPHA:
            text = "Invalid alpha value.";
            break;
        case LGD_INVALID_SIGMA:
            text = "Invalid sigma value.";
            break;
        case LGD_NAN_VALUE:
            text = "NaN values found.";
            break;
        default:
            break;
    }
    const std::string err_str(text);
    // Failures are raised as std::string when throwing was requested.
    if (err_throw && !succeeded) throw err_str;
    ss << err_str;
    // Restore the console colour and finish the line (reporting mode only).
    if (!err_throw)
    {
 #if defined _WINDOWS || __WIN32__
        SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), 7);
        ss << std::endl;
 #else
        ss << "\033[0m" << std::endl;
 #endif
    }
 }
 /// Return a copy of the library's default L-GD parameter set.
 gctl::lgd_para gctl::lgd_solver::default_lgd_para()
 {
    return lgd_defparam;
 }
 /**
  * Run the L-GD solver and report its outcome.
  *
  * In silent mode the solver runs without timing or reporting, and a failure
  * (negative return code) is always raised as an exception, whatever err_throw
  * says. Otherwise the run is timed, the elapsed time is printed to std::clog
  * unless err_throw is set, and the return code is reported through
  * lgd_error_str() when `verbose` is set or the run failed.
  */
 void gctl::lgd_solver::LGD_Minimize(array<double> &best_m, array<double> &mean_m, array<double> &std_m, 
    std::ostream &ss, bool verbose, bool err_throw)
 {
    if (lgd_silent_)
    {
        const lgd_return_code status = lgd(best_m, mean_m, std_m);
        if (status < 0) lgd_error_str(status, ss, true);
        return;
    }
    // Time the solve: wall clock with OpenMP, processor time otherwise.
 #ifdef GCTL_OPENMP
    const double tic = omp_get_wtime();
    const lgd_return_code status = lgd(best_m, mean_m, std_m);
    const double toc = omp_get_wtime();
    const double elapsed_ms = 1000*(toc-tic);
 #else
    const clock_t tic = clock();
    const lgd_return_code status = lgd(best_m, mean_m, std_m);
    const clock_t toc = clock();
    const double elapsed_ms = 1000*(toc-tic)/(double)CLOCKS_PER_SEC;
 #endif
    if (!err_throw)
    {
        std::clog << std::endl << "Solver: LGD. Time cost: " << elapsed_ms << " ms" << std::endl;
    }
    // Successful runs are reported only on request; failures are always reported.
    if (verbose || status < 0)
    {
        lgd_error_str(status, ss, err_throw);
    }
 }
 /**
  * Run the solver with a per-variable scaling of the flight length.
  *
  * Every entry of `alphas` must be strictly positive and `alphas` must have the
  * same length as `best_m`; otherwise std::runtime_error is thrown. The scaling
  * is stored in the solver and the base LGD_Minimize overload is then invoked.
  */
 void gctl::lgd_solver::LGD_Minimize(array<double> &best_m, array<double> &mean_m, array<double> &std_m, 
    const array<double> &alphas, std::ostream &ss, bool verbose, bool err_throw)
 {
    lgd_ques_num_ = best_m.size();
    if (lgd_ques_num_ != alphas.size())
        throw std::runtime_error("[gctl::lgd_solver] arraies' size do not match.");
    lgd_alpha_.resize(lgd_ques_num_);
    // Validate and copy in one pass.
    for (int k = 0; k < lgd_ques_num_; ++k)
    {
        const double scale = alphas[k];
        if (scale <= 0.0)
            throw std::runtime_error("[gctl::lgd_solver] Invalid scaling value.");
        lgd_alpha_[k] = scale;
    }
    lgd_has_alpha_ = true;
    LGD_Minimize(best_m, mean_m, std_m, ss, verbose, err_throw);
 }
 /**
  * Run the solver with per-variable lower and upper bounds.
  *
  * `lows` and `higs` must both have the length of `best_m`, and every lower
  * bound must be strictly smaller than its upper bound; otherwise
  * std::runtime_error is thrown. The bounds are stored in the solver and the
  * base LGD_Minimize overload is then invoked.
  */
 void gctl::lgd_solver::LGD_Minimize(array<double> &best_m, array<double> &mean_m, array<double> &std_m, 
    const array<double> &lows, const array<double> &higs, std::ostream &ss, bool verbose, bool err_throw)
 {
    lgd_ques_num_ = best_m.size();
    if (lgd_ques_num_ != lows.size() || lgd_ques_num_ != higs.size())
        throw std::runtime_error("[gctl::lgd_solver] arraies' size do not match.");
    lgd_low_.resize(lgd_ques_num_);
    lgd_hig_.resize(lgd_ques_num_);
    // Validate and copy in one pass.
    for (int k = 0; k < lgd_ques_num_; ++k)
    {
        const double lower = lows[k];
        const double upper = higs[k];
        if (lower >= upper)
            throw std::runtime_error("[gctl::lgd_solver] Invalid bound value.");
        lgd_low_[k] = lower;
        lgd_hig_[k] = upper;
    }
    lgd_has_range_ = true;
    LGD_Minimize(best_m, mean_m, std_m, ss, verbose, err_throw);
 }
 /**
  * Run the solver with one lower and one upper bound shared by all variables.
  *
  * Throws std::runtime_error unless low < hig. The bound arrays are resized to
  * the length of `best_m` with `low` / `hig` as the fill value, and the base
  * LGD_Minimize overload is then invoked.
  */
 void gctl::lgd_solver::LGD_Minimize(array<double> &best_m, array<double> &mean_m, array<double> &std_m, 
    double low, double hig, std::ostream &ss, bool verbose, bool err_throw)
 {
    if (low >= hig)
        throw std::runtime_error("[gctl::lgd_solver] Invalid bound value.");
    lgd_ques_num_ = best_m.size();
    lgd_low_.resize(lgd_ques_num_, low);
    lgd_hig_.resize(lgd_ques_num_, hig);
    lgd_has_range_ = true;
    LGD_Minimize(best_m, mean_m, std_m, ss, verbose, err_throw);
 }
 /**
  * Core loop of the Lévy-flight gradient descent.
  *
  * Starting from the solution held in `best_m`, the loop evaluates the
  * objective and its gradient through LGD_Evaluate(), remembers the best
  * solution seen so far, accumulates the running mean / standard deviation of
  * the recorded solutions, and then moves against the normalised gradient by a
  * randomly drawn Lévy step length. The loop body runs flight_times + 1 times
  * (ft = 0 ... flight_times).
  *
  * @param best_m In: initial solution. Out: best solution found, except when
  *               LGD_NAN_VALUE is returned, in which case it holds the
  *               invalid trial solution.
  * @param mean_m Out: running mean of the recorded solutions (reset to zero on entry).
  * @param std_m  Out: running standard deviation of the recorded solutions (reset to zero on entry).
  * @return LGD_CONVERGENCE, LGD_STOP or LGD_REACHED_MAX_ITERATIONS on success,
  *         or a negative LGD_INVALID_* / LGD_NAN_VALUE code on failure.
  */
 gctl::lgd_return_code gctl::lgd_solver::lgd(array<double> &best_m, array<double> &mean_m, array<double> &std_m)
 {
    lgd_ques_num_ = best_m.size();
    // Validate the problem size and the parameters before doing any work.
    if (lgd_ques_num_ <= 0) return LGD_INVALID_SOLUTION_SIZE;
    if (lgd_param_.flight_times <= 0) return LGD_INVALID_MAX_ITERATIONS;
    if (lgd_param_.epsilon <= 0) return LGD_INVALID_EPSILON;
    if (lgd_param_.stddev_v <= 0) return LGD_INVALID_STDV;
    if (lgd_param_.beta <= 1.0 || lgd_param_.beta >= 2.0) return LGD_INVALID_BETA;
    if (lgd_param_.alpha <= 0) return LGD_INVALID_ALPHA;
    if (lgd_param_.sigma <= 0) return LGD_INVALID_SIGMA;
    // Reset the statistics that are returned to the caller.
    mean_m.resize(lgd_ques_num_, 0.0); std_m.resize(lgd_ques_num_, 0.0);
    // Standard deviation of the numerator variable u of the Lévy step, derived from beta.
    double gamma1 = tgamma(lgd_param_.beta + 1.0);
    double gamma2 = tgamma(0.5*(lgd_param_.beta + 1.0));
    double stddev_u = pow((gamma1*sin(0.5*GCTL_Pi*lgd_param_.beta)) / (gamma2*lgd_param_.beta*pow(2, 0.5*(lgd_param_.beta-1.0))), 1.0/lgd_param_.beta);
    // The random engine is seeded from the system clock, so runs are not reproducible.
    unsigned seed = std::chrono::system_clock::now().time_since_epoch().count();
    std::default_random_engine generator(seed);
    std::normal_distribution<double> dist_u(0, stddev_u);
    std::normal_distribution<double> dist_v(0, lgd_param_.stddev_v);
    std::uniform_real_distribution<double> dist_s(1.0, 2.0);
    // g      : gradient at the current trial solution
    // g_mean : scratch gradient for the mean-solution evaluation, kept separate
    //          so that evaluating the mean does not overwrite g
    // g_mem  : [0, n) previous gradient, [n, 2n) random vector to orthogonalise
    // g_orth : output of schmidt_orthogonal()
    // b_m    : best solution seen so far
    array<double> g, g_mean, g_mem, g_orth, new_mean, b_m, alphas;
    g.resize(lgd_ques_num_); g_mean.resize(lgd_ques_num_);
    g_mem.resize(2*lgd_ques_num_); g_orth.resize(2*lgd_ques_num_);
    new_mean.resize(lgd_ques_num_); b_m.resize(lgd_ques_num_); alphas.resize(lgd_ques_num_);
    // Initialise the per-variable step scale to lgd_param_.alpha.
    vecset(alphas, lgd_param_.alpha);
    if (lgd_has_range_)
    {
        // presumably alphas = alpha*(hig - low) — TODO confirm against vecdiff/vecscale
        vecdiff(alphas, lgd_hig_, lgd_low_);
        vecscale(alphas, lgd_param_.alpha);
    }
    if (lgd_has_alpha_)
    {
        // presumably alphas = alpha*lgd_alpha_ — TODO confirm against veccpy
        veccpy(alphas, lgd_alpha_, lgd_param_.alpha);
    }
    double fx_best, fx_tmp, direct_mod, levy_length;
    double fx_mean = NAN;
    // Start the flights.
    int rcd_times = 0;
    lgd_trace_times_ = 0;
    // NOTE(review): lgd_trace_ itself is not emptied here, so a second run on the
    // same solver appends to the trace recorded by the first one — confirm intent.
    for (int ft = 0; ft <= lgd_param_.flight_times; ft++)
    {
        // Evaluate the trial solution.
        fx_tmp = LGD_Evaluate(best_m, g);
        if (ft == 0 || fx_tmp < fx_best)
        {
            fx_best = fx_tmp;
            veccpy(b_m, best_m);
        }
        // Record the solution: always when lambda is non-positive, otherwise
        // only if its objective value does not exceed lambda.
        if (lgd_param_.lambda <= 0.0 || (lgd_param_.lambda > 0.0 && fx_tmp <= lgd_param_.lambda))
        {
            for (int i = 0; i < lgd_ques_num_; i++)
            {
                // presumably updates the running std and outputs the new mean in new_mean[i] — TODO confirm
                std_m[i] = dynamic_stddev(std_m[i], rcd_times, mean_m[i], best_m[i], new_mean[i]);
                mean_m[i] = new_mean[i];
            }
            rcd_times++;
            if (lgd_save_trace_)
            {
                lgd_trace_.append_array(best_m);
                lgd_trace_times_++;
            }
        }
        if (LGD_Progress(ft, fx_tmp, fx_mean, fx_best, lgd_param_))
        {
            // Hand the best solution found back through best_m.
            veccpy(best_m, b_m);
            return LGD_STOP;
        }
        if (lgd_param_.batch > 0 && (rcd_times+1)%lgd_param_.batch == 0)
        {
            // Mean convergence test. The gradient goes into g_mean: g must keep
            // the gradient at best_m for the stagnation test and the flight below.
            fx_mean = LGD_Evaluate(mean_m, g_mean);
            if (fx_mean < lgd_param_.epsilon)
            {
                LGD_Progress(ft, fx_tmp, fx_mean, fx_best, lgd_param_);
                // Hand the best solution found back through best_m.
                veccpy(best_m, b_m);
                return LGD_CONVERGENCE;
            }
        }
        // Stagnation-point test.
        direct_mod = sqrt(vecdot(g, g));
        if (direct_mod < lgd_param_.sigma)
        {
            if (ft == 0) // no previous direction is recorded on the first flight
            {
                do // the gradient vanished: draw a random direction instead
                {
                    for (int i = 0; i < lgd_ques_num_; i++)
                    {
                        g[i] = dist_s(generator);
                    }
                    direct_mod = sqrt(vecdot(g, g));
                }
                while (direct_mod < lgd_param_.sigma);
            }
            else // the gradient vanished: step orthogonally to the previous direction
            {
                for (int i = 0; i < lgd_ques_num_; i++)
                {
                    g_mem[i+lgd_ques_num_] = dist_s(generator);
                }
                schmidt_orthogonal(g_mem, g_orth, 2);
                for (int i = 0; i < lgd_ques_num_; i++)
                {
                    g[i] = g_orth[i+lgd_ques_num_];
                }
                direct_mod = 1.0; // the direction is treated as having unit modulus here
            }
        }
        // Length of the Lévy flight. The original formula has no outermost
        // absolute value; only the magnitude of the step is needed here.
        levy_length = fabs(dist_u(generator)/pow(fabs(dist_v(generator)), 1.0/lgd_param_.beta));
        for (int i = 0; i < lgd_ques_num_; i++)
        {
            best_m[i] -= levy_length*alphas[i]*g[i]/direct_mod;
        }
        if (!vecvalid(best_m))
        {
            return LGD_NAN_VALUE;
        }
        // Remember the direction of this flight for the orthogonal escape step.
        for (int i = 0; i < lgd_ques_num_; i++)
        {
            g_mem[i] = g[i];
        }
        // Apply the range constraints, if any.
        if (lgd_has_range_)
        {
            // presumably clamp best_m into [lgd_low_, lgd_hig_] — TODO confirm against vecbtm/vectop
            vecbtm(best_m, lgd_low_);
            vectop(best_m, lgd_hig_);
        }
    }
    // Hand the best solution found back through best_m.
    veccpy(best_m, b_m);
    return LGD_REACHED_MAX_ITERATIONS;
 }
--- a/lib/optimization/lgd.h
+++ b/lib/optimization/lgd.h
@ -0,0 +1,212 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_LGD_H
 #define _GCTL_LGD_H
 #include "gctl/core.h"
 #include "gctl/io.h"
 #include "gctl/maths.h"
 #include "gctl/algorithm.h"
 #include "gctl_optimization_config.h"
 #ifdef GCTL_OPTIMIZATION_TOML
 #include "toml.hpp"
 #endif // GCTL_OPTIMIZATION_TOML
 #if defined _WINDOWS || __WIN32__
 #include "windows.h"
 #endif // _WINDOWS || __WIN32__
 #ifdef GSTL_OPENMP
 #include "omp.h"
 #endif // GSTL_OPENMP
 namespace gctl
 {
 	/**
 	 * @brief      Return values of the lgd_solver class. Non-negative values 
 	 * report a successful termination; negative values report an error.
 	 */
 	enum lgd_return_code
 	{
 		LGD_CONVERGENCE = 1, ///< The iteration reached convergence.
 		LGD_STOP, ///< The iteration was stopped by the progress monitoring function.
 		LGD_REACHED_MAX_ITERATIONS, ///< The maximal number of flights was reached.
        LGD_INVALID_SOLUTION_SIZE = -1024, ///< Invalid (non-positive) solution size.
 		LGD_INVALID_MAX_ITERATIONS, ///< The maximal flight times is not positive.
        LGD_INVALID_EPSILON, ///< The epsilon is not positive.
 		LGD_INVALID_STDV, ///< The standard deviation stddev_v is not positive.
        LGD_INVALID_BETA, ///< Invalid value for beta (must lie strictly between 1.0 and 2.0).
        LGD_INVALID_ALPHA, ///< The alpha is not positive.
        LGD_INVALID_SIGMA, ///< The sigma is not positive.
 		LGD_NAN_VALUE, ///< The trial solution failed the validity check (NaN values).
 	};
    /**
     * @brief    Parameters of the L-GD method.
     */
    struct lgd_para
    {
        /**
         * Maximal times of the lévy flight. The iteration process runs until the maximal 
         * flight times is reached unless the mean convergence test is enabled and satisfied. 
         * To activate the test, set the 'batch' parameter described below. Must be positive. 
         * The default value is 1000.
         */
        int flight_times;
        /**
         * Batch size for the mean convergence test. This parameter determines the interval, 
         * counted in recorded solutions, at which the objective function of the mean solution 
         * is evaluated. Note that only qualified solutions are recorded if the 'lambda' 
         * parameter is set. The library does not perform the mean convergence test if the 
         * value of this parameter is zero. The default is 0.
         */
        int batch;
        /**
         * Epsilon for the mean convergence test. The iteration is reported as converged once 
         * the objective value of the mean solution drops below epsilon. Must be positive. 
         * The default is 1e-5.
         */
        double epsilon;
        /**
         * Standard deviation of the normally distributed variable v that is used to 
         * calculate the length of each lévy flight as length = |u|/|v|^{1/beta}, where u 
         * is normally distributed with a standard deviation derived from beta. Must be 
         * positive. This parameter is typically given as 1.0.
         */
        double stddev_v;
        /**
         * Scale parameter for calculating stddev_u and the flying length. Must lie in the 
         * open interval (1.0, 2.0). The default value is 1.5. The bigger beta is, the 
         * smaller the range of the flying length gets.
         */
        double beta;
        /**
         * Scale parameter multiplied by the flying length. Must be positive. The default 
         * value is 0.01. The parameter should be set according to the expected convergence 
         * speed. Normally, the bigger alpha is, the faster the L-GD converges. However, the 
         * L-GD may miss the optimized solutions if alpha is too big.
         */
        double alpha;
        /**
         * Sigma for the stagnation point test. The algorithm takes one search step 
         * orthogonal to the last iteration if the modulus of the gradient is smaller 
         * than sigma. This mechanism helps the algorithm escape from stagnation 
         * points such as local minima or saddle points. Must be positive. The default 
         * is 1e-8.
         */
        double sigma;
        /**
         * Threshold for recording the search paths. If the value is bigger than zero, then 
         * only solutions whose objective value is smaller than or equal to the threshold are 
         * used for the statistical analysis. Otherwise, all solutions are used. The recorded 
         * paths can be saved to file using the save_lgd_trace(string) function if 
         * set_lgd_record_trace() has been called. The default is -1.0.
         */
        double lambda;
    };
    /**
     * @brief    Base class of the Lévy-Gradient Descent (L-GD) solver. Derive from it and 
     * implement LGD_Evaluate() to describe the optimizing problem, then call one of the 
     * LGD_Minimize() overloads.
     */
    class lgd_solver
    {
    public:
        lgd_solver(); ///< Default constructor. Starts from the default parameters.
        virtual ~lgd_solver(); ///< Destructor.
        /**
         * @brief Interface for the evaluation of the objective function. Concrete 
         * contents of this function is determined according to the optimizing problem. 
         * 
         * @param x Inputs of the current solution.
         * @param g Outputs of the model gradient calculated using the input solution.
         * @return Current objective value.
         */
        virtual double LGD_Evaluate(const array<double> &x, array<double> &g) = 0;
        /**
         * @brief Default monitoring function of the optimizing process. The default 
         * implementation prints a status line to std::clog and always returns zero.
         * 
         * @param curr_t Current flight times.
         * @param curr_fx Objective value of the current solution.
         * @param mean_fx Objective value of the mean solution.
         * @param best_fx Objective value of the best solution. 
         * @param param L-GD's parameters used for the optimizing process.
         * @return The optimizing process will be stopped if a non-zero value is returned.
         */
        virtual int LGD_Progress(const int curr_t, const double curr_fx, const double mean_fx, 
            const double best_fx, const lgd_para &param);
        /// Turn on the silent mode: no progress or timing output; failures are thrown.
        void lgd_silent();
        /// Set the interval, in flights, at which the default monitor reports progress.
        void set_lgd_report_interval(int inter);
        /// Print the current parameters to std::clog.
        void show_solver();
        void set_lgd_record_trace(); ///< Turn on the recording of flight traces.
        // Save flight traces to file. Note that only qualified solutions will be 
        // saved if the recording threshold is set. 
        void save_lgd_trace(std::string trace_file);
        /// Return a copy of the default parameters.
        lgd_para default_lgd_para();
        /// Set the parameters from a lgd_para object.
        void set_lgd_para(const lgd_para &param);
 #ifdef GCTL_OPTIMIZATION_TOML
        /// Set the parameters from the "lgd" table of a TOML file.
        void set_lgd_para(std::string filename);
        /// Set the parameters from the "lgd" table of a parsed TOML document.
        void set_lgd_para(const toml::value &toml_data);
 #endif // GCTL_OPTIMIZATION_TOML
        /**
         * @brief Run the L-GD solver.
         * 
         * @param best_m In: initial solution. Out: best solution found.
         * @param mean_m Out: mean of the recorded solutions.
         * @param std_m Out: standard deviation of the recorded solutions.
         * @param ss Output stream of the result message.
         * @param verbose Report the result message even if the run succeeded.
         * @param err_throw Throw the error message instead of printing it.
         */
        void LGD_Minimize(array<double> &best_m, array<double> &mean_m, array<double> &std_m, 
            std::ostream &ss = std::clog, bool verbose = true, bool err_throw = false);
        /**
         * @brief Run the L-GD solver with a per-variable scaling of the flight length. 
         * Throws std::runtime_error if the array sizes do not match or any scaling 
         * value is not positive.
         * 
         * @param alphas Positive scaling value of each variable.
         */
        void LGD_Minimize(array<double> &best_m, array<double> &mean_m, array<double> &std_m, 
            const array<double> &alphas, std::ostream &ss = std::clog, 
            bool verbose = true, bool err_throw = false);
        /**
         * @brief Run the L-GD solver with per-variable bounds. Throws std::runtime_error 
         * if the array sizes do not match or a lower bound is not smaller than its 
         * upper bound.
         * 
         * @param lows Lower bound of each variable.
         * @param higs Upper bound of each variable.
         */
        void LGD_Minimize(array<double> &best_m, array<double> &mean_m, array<double> &std_m, 
            const array<double> &lows, const array<double> &higs, std::ostream &ss = std::clog, 
            bool verbose = true, bool err_throw = false);
        /**
         * @brief Run the L-GD solver with one pair of bounds shared by all variables. 
         * Throws std::runtime_error if low is not smaller than hig.
         * 
         * @param low Lower bound of all variables.
         * @param hig Upper bound of all variables.
         */
        void LGD_Minimize(array<double> &best_m, array<double> &mean_m, array<double> &std_m, 
            double low, double hig, std::ostream &ss = std::clog, bool verbose = true, 
            bool err_throw = false);
    private:
        /// Print (or throw) the message that belongs to a return code.
        void lgd_error_str(lgd_return_code err_code, std::ostream &ss = std::clog, bool err_throw = false);
        /// Core iteration of the L-GD method.
        lgd_return_code lgd(array<double> &best_m, array<double> &mean_m, array<double> &std_m);
    private:
        lgd_para lgd_param_; ///< Parameters in use.
        // Report interval, problem size and number of recorded trace rows.
        int lgd_inter_, lgd_ques_num_, lgd_trace_times_;
        // Silent mode, bounds given, per-variable scaling given, trace recording on.
        bool lgd_silent_, lgd_has_range_, lgd_has_alpha_, lgd_save_trace_;
        // Lower bounds, upper bounds, per-variable scaling, and the flat trace buffer.
        array<double> lgd_low_, lgd_hig_, lgd_alpha_, lgd_trace_;
    };
 }
 #endif // _GCTL_LGD_H
--- a/lib/optimization/loss_func.cpp
+++ b/lib/optimization/loss_func.cpp
@ -0,0 +1,100 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2023  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "loss_func.h"
 /**
  * Default constructor. Creates an object without targets; init() must be
  * called before evaluate() or gradient() is used.
  */
 gctl::loss_func::loss_func()
 {
    uncer_type_ = 0;
    // Give the accumulator and the target count defined values: evaluate()
    // adds to loss_ and get_loss() reads it, so it must not start indeterminate.
    tar_num_ = 0;
    loss_ = 0.0;
 }
 /**
  * Construct the loss function from its target values and norm type.
  *
  * @param tar    Target values.
  * @param n_type Norm used to measure the misfit.
  */
 gctl::loss_func::loss_func(const array<double> &tar, norm_type_e n_type)
 {
    uncer_type_ = 0;
    // Start with an empty accumulator (see the default constructor).
    loss_ = 0.0;
    init(tar, n_type);
 }
 /// The destructor has nothing to release explicitly.
 gctl::loss_func::~loss_func(){}
 void gctl::loss_func::init(const array<double> &tar, norm_type_e n_type)
 {
    tar_num_ = tar.size();
    tars_ = tar;
    norm_type_ = n_type;
    return;
 }
 /// Use one uncertainty value for all targets (uncertainty mode 1).
 void gctl::loss_func::set_uncertainty(double uncer)
 {
    uncer_ = uncer;
    uncer_type_ = 1;
 }
 /// Use an individual uncertainty value for every target (uncertainty mode 2).
 void gctl::loss_func::set_uncertainty(const array<double> &uncer)
 {
    uncers_ = uncer;
    uncer_type_ = 2;
 }
 /// Return the loss accumulated by evaluate() so far and reset the accumulator to zero.
 double gctl::loss_func::get_loss()
 {
    const double accumulated = loss_;
    loss_ = 0.0;
    return accumulated;
 }
 /**
  * Evaluate the misfit term of one datum.
  *
  * The residual inp - target is divided by the uncertainty (when one is set)
  * and passed through the selected norm. The un-normalised term is added to
  * the internal accumulator; the returned value is the term divided by the
  * number of targets.
  *
  * @param inp Predicted value.
  * @param id  Index of the target to compare against.
  */
 double gctl::loss_func::evaluate(double inp, int id)
 {
    double term = inp - tars_[id];
    switch (uncer_type_)
    {
        case 1: term /= uncer_; break;
        case 2: term /= uncers_[id]; break;
        default: break;
    }
    if (norm_type_ == L1) term = fabs(term);
    else if (norm_type_ == L2) term = term*term;
    loss_ += term;
    return term/tar_num_;
 }
 /**
  * Derivative of one misfit term with respect to the predicted value.
  *
  * L1: sign of the residual, divided by the uncertainty c when one is set.
  * L2: twice the residual, divided by c*c when an uncertainty is set.
  * The result is divided by the number of targets.
  *
  * @param inp Predicted value.
  * @param id  Index of the target to compare against.
  */
 double gctl::loss_func::gradient(double inp, int id)
 {
    const double residual = inp - tars_[id];
    double grad = residual;
    if (norm_type_ == L1)
    {
        if (residual >= 0) grad = 1.0;
        else if (residual < 0) grad = -1.0;
    }
    else if (norm_type_ == L2)
    {
        grad = 2.0*residual;
    }
    if (uncer_type_ != 0)
    {
        // Mode 1 uses the shared uncertainty, mode 2 the per-target one.
        const double c = (uncer_type_ == 1) ? uncer_ : uncers_[id];
        if (norm_type_ == L1) grad /= c;
        else if (norm_type_ == L2) grad /= (c*c);
    }
    return grad/tar_num_;
 }
--- a/lib/optimization/loss_func.h
+++ b/lib/optimization/loss_func.h
@ -0,0 +1,61 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2023  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_LOSS_FUNC_H
 #define _GCTL_LOSS_FUNC_H
 // library's head files
 #include "gctl/core.h"
 namespace gctl
 {
    /**
     * @brief    Element-wise loss (misfit) function between predicted values and a set 
     * of targets, measured with an L1 or L2 norm and optionally weighted by uncertainties.
     */
    class loss_func
    {
    public:
        loss_func(); ///< Default constructor. Call init() before use.
        loss_func(const array<double> &tar, norm_type_e n_type); ///< Construct and initialize.
        virtual ~loss_func(); ///< Destructor.
        /// Set the target values and the norm type.
        void init(const array<double> &tar, norm_type_e n_type);
        /// Use one uncertainty value for all targets.
        void set_uncertainty(double uncer);
        /// Use an individual uncertainty value for every target.
        void set_uncertainty(const array<double> &uncer);
        /// Return the loss accumulated by evaluate() and reset the accumulator to zero.
        double get_loss();
        /// Evaluate the misfit term of target 'id', add it to the accumulator and return it divided by the target number.
        double evaluate(double inp, int id);
        /// Return the derivative of the misfit term of target 'id' with respect to 'inp', divided by the target number.
        double gradient(double inp, int id);
    private:
        //unsigned int counter_;
        unsigned int tar_num_; ///< Number of targets.
        int uncer_type_; ///< 0: no uncertainty, 1: one shared value, 2: one value per target.
        double uncer_, loss_; ///< Shared uncertainty and the loss accumulator.
        norm_type_e norm_type_; ///< Norm type of the misfit.
        array<double> tars_; ///< Target values.
        array<double> uncers_; ///< Per-target uncertainties.
    };
 }
 #endif // _GCTL_LOSS_FUNC_H
--- a/lib/optimization/lu.cpp
+++ b/lib/optimization/lu.cpp
@ -0,0 +1,152 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "lu.h"
 /**
  * Bind the solver to the matrix that will be factorized in place.
  *
  * The matrix is kept by reference, so it must outlive this object. A
  * domain_error is thrown when the matrix is empty or not square.
  */
 gctl::lu::lu(matrix<double> &sourceMatrix) : decomposedMatrix(sourceMatrix)
 {
    // empty() is tested first so the size comparison is skipped for an empty matrix.
    const bool unusable = sourceMatrix.empty()
        || sourceMatrix.row_size() != sourceMatrix.col_size();

    if (unusable) throw domain_error("Invalid input matrix. From lu::lu(...)");
 }
 // In-place LU factorization with partial (row) pivoting.
 //
 // After the call the referenced matrix holds both factors: the multipliers of L
 // (unit diagonal implied) below the diagonal and U on and above it. Rows are
 // never moved physically; rowPermutation[k] tells which stored row acts as the
 // k-th row of the factorization.
 //
 // Throws runtime_error when a zero pivot is met, i.e. the matrix is singular.
 // Singularity is judged on the pivots themselves and not on the product of the
 // pivots: the determinant of a perfectly regular matrix can underflow to zero
 // (or overflow) for large systems, which would reject a solvable problem.
 void gctl::lu::decompose()
 {
    const int n = decomposedMatrix.row_size();

    // Start from the identity permutation.
    rowPermutation.resize(n);
    for (int i = 0; i < n; i++)
    {
        rowPermutation[i] = i;
    }

    for (int p = 0; p < n - 1; p++)
    {
        // Partial pivoting: bring the entry with the largest magnitude of column p
        // (among the not yet eliminated rows) to position p of the permutation.
        for (int i = p + 1; i < n; i++)
        {
            if (std::fabs(decomposedMatrix[rowPermutation[i]][p]) > std::fabs(decomposedMatrix[rowPermutation[p]][p]))
            {
                // Indices are integers, so swap them through an integer temporary.
                const int swapped = rowPermutation[p];
                rowPermutation[p] = rowPermutation[i];
                rowPermutation[i] = swapped;
            }
        }

        const int pivotRow = rowPermutation[p];
        if (decomposedMatrix[pivotRow][p] == 0.0)
        {
            // The whole remaining column is zero: the matrix is singular.
            throw runtime_error("The input matrix is singular. From gctl::lu::decompose()");
        }

        for (int i = p + 1; i < n; i++)
        {
            const int row = rowPermutation[i];

            // Store the multiplier in the slot of the eliminated entry (this is L).
            decomposedMatrix[row][p] /= decomposedMatrix[pivotRow][p];

            // Eliminate column p from the rest of the row (this builds U).
            for (int j = p + 1; j < n; j++)
            {
                decomposedMatrix[row][j] -= decomposedMatrix[row][p] * decomposedMatrix[pivotRow][j];
            }
        }
    }

    // The last pivot is not visited by the loop above, so check it separately.
    if (decomposedMatrix[rowPermutation[n - 1]][n - 1] == 0.0)
    {
        throw runtime_error("Determinant of the input matrix is zero. From gctl::lu::decompose()");
    }
 }
 // Solve A x = b for x, where A is the matrix as it was before decompose().
 //
 // b is only read. x is resized to b.size() and overwritten with the solution.
 // decompose() must have been called beforehand.
 //
 // Throws domain_error when b is empty or when its size does not match the
 // dimension recorded by decompose() (this also covers a missing decompose()).
 void gctl::lu::solve(const array<double>& b, array<double> &x)
 {
    // The decomposed matrix stores both triangular factors. Its rows were permuted
    // logically during the factorization; rowPermutation gives the proper row order.
    // The lower factor only uses the entries below the diagonal (its diagonal is an
    // implied 1), the upper factor uses the diagonal and everything above it.
    if (b.empty())
    {
        throw domain_error("Invalid target vector. From gctl::lu::solve(...)");
    }

    // Without this check a size mismatch would index rowPermutation and the
    // matrix rows out of range.
    if (b.size() != rowPermutation.size())
    {
        throw domain_error("Target vector size does not match the decomposed matrix. From gctl::lu::solve(...)");
    }

    const int n = b.size();
    x.resize(b.size());

    // Forward substitution: solve L y = P b, storing y in x.
    for (int i = 0; i < n; i++)
    {
        const int currentRow = rowPermutation[i];
        double sum = 0.0;
        for (int j = 0; j < i; j++)
        {
            sum += (decomposedMatrix[currentRow][j] * x[j]);
        }
        x[i] = (b[currentRow] - sum);
    }

    // Back substitution: solve U x = y. The solution overwrites y in place, so no
    // additional vector is needed.
    for (int i = n - 1; i >= 0; i--)
    {
        const int currentRow = rowPermutation[i];
        double sum = 0.0;
        for (int j = n - 1; j > i; j--)
        {
            sum += (decomposedMatrix[currentRow][j] * x[j]);
        }
        x[i] = (x[i] - sum) / decomposedMatrix[currentRow][i];
    }
 }
--- a/lib/optimization/lu.h
+++ b/lib/optimization/lu.h
@ -0,0 +1,56 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_LU_H
 #define _GCTL_LU_H
 #include "gctl/core.h"
 namespace gctl
 {
    /**
     * @brief      Lower/upper decomposition of a square matrix into a lower triangular matrix and an upper triangular matrix.
     *
     * The class works on matrix<double> only (it is not a template). The matrix
     * is held by reference and overwritten by decompose(), so it must stay alive
     * for as long as this object is used. Copying is disabled.
     */
    class lu
    {
    public:
        lu(matrix<double> &sourceMatrix); // Binds the matrix that will be decomposed in-place; throws if it is empty or not square
        virtual ~lu(){}
        void decompose(); ///< Decomposition into triangular matrices. Returns nothing; throws a runtime_error if the matrix is singular
        void solve(const array<double>& b, array<double> &x); ///< Solve for x in form Ax = b. A is the original input matrix; call decompose() first.
    protected:
        lu(const lu&) = delete;    
        void operator=(const lu&) = delete;
        matrix<double> &decomposedMatrix; // Reference to the caller's matrix; holds both triangular factors after decompose()
        array<int> rowPermutation; // Row order produced by the pivoting in decompose()
    };
 }
 #endif // _GCTL_LU_H
--- a/lib/optimization/sgd.cpp
+++ b/lib/optimization/sgd.cpp
@ -0,0 +1,634 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "sgd.h"
 /**
 * Default parameters for the SGD methods.
 *
 * The initializers follow the member order of gctl::sgd_para:
 * iteration = 0, epsilon = 1e-6, mu = 0.01, alpha = 0.01,
 * beta_1 = 0.9, beta_2 = 0.999, sigma = 1e-8.
 */
 static const gctl::sgd_para sgd_defparam = {0, 1e-6, 0.01, 0.01, 0.9, 0.999, 1e-8};
 /**
  * Create a solver with the default parameter set, a progress report on every
  * iteration, console output enabled and no solver selected yet.
  */
 gctl::sgd_solver::sgd_solver()
    : sgd_param_(sgd_defparam),
      sgd_inter_(1),
      sgd_silent_(false),
      solver_name_("Undefined")
 {
 }
 // Nothing to release explicitly; the body is intentionally empty.
 gctl::sgd_solver::~sgd_solver(){}
 /**
  * Default progress monitor, called by every solver once per iteration.
  *
  * Unless the solver is silenced, the current objective value and iteration
  * count are written to std::clog when either the objective has dropped to
  * param.epsilon or below (for a positive epsilon), or k is a multiple of the
  * report interval. The model x is not inspected here.
  *
  * @return Always 0. The solvers stop with SGD_STOP on any non-zero value,
  *         which an overriding implementation may use.
  */
 int gctl::sgd_solver::SGD_Progress(double fx, const array<double> &x, const sgd_para &param, const int k)
 {
    if (!sgd_silent_)
    {
        const bool converged = param.epsilon > 0.0 && fx <= param.epsilon;
        // The interval is tested for positivity before it is used as a divisor.
        const bool scheduled = sgd_inter_ > 0 && k%sgd_inter_ == 0;

        if (converged || scheduled)
        {
            std::clog << GCTL_CLEARLINE << "\rF(x) = " << fx << ", Train-Times = " << k;
        }
    }
    return 0;
 }
 /**
  * Switch the solver to silent mode. There is no counterpart in this class to
  * switch it back on.
  */
 void gctl::sgd_solver::sgd_silent()
 {
    sgd_silent_ = true;
 }
 /**
  * Set how often (in iterations) the default progress monitor reports.
  * The value is stored as given; a value of zero or below disables the
  * periodic report in SGD_Progress().
  */
 void gctl::sgd_solver::set_sgd_report_interval(int inter)
 {
    sgd_inter_ = inter;
 }
 /**
  * Replace the whole parameter set. No validation happens here; each solver
  * checks the parameters it uses when it starts.
  */
 void gctl::sgd_solver::set_sgd_para(const sgd_para &in_param)
 {
    sgd_param_ = in_param;
 }
 // The declaration of this overload (and the inclusion of toml.hpp) is guarded by
 // GCTL_OPTIMIZATION_TOML in sgd.h, so the definition has to be guarded as well.
 // Otherwise the library does not compile when the TOML option is switched off.
 #ifdef GCTL_OPTIMIZATION_TOML
 /**
  * Load the parameters from the [sgd] table of a TOML document.
  *
  * The parameter set is first reset to the defaults. Every key found in the
  * table (iteration, epsilon, mu, alpha, beta_1, beta_2, sigma) then overrides
  * its default; missing keys, or a missing table, leave the defaults in place.
  */
 void gctl::sgd_solver::set_sgd_para(const toml::value &toml_data)
 {
    sgd_param_ = sgd_defparam;

    const std::string SGD = "sgd";
    if (!toml_data.contains(SGD)) return;

    // Look the table up once instead of once per key.
    const auto &section = toml_data.at(SGD);

    if (section.contains("iteration")) sgd_param_.iteration = toml::find<int>(section, "iteration");
    if (section.contains("epsilon"))   sgd_param_.epsilon = toml::find<double>(section, "epsilon");
    if (section.contains("mu"))        sgd_param_.mu = toml::find<double>(section, "mu");
    if (section.contains("alpha"))     sgd_param_.alpha = toml::find<double>(section, "alpha");
    if (section.contains("beta_1"))    sgd_param_.beta_1 = toml::find<double>(section, "beta_1");
    if (section.contains("beta_2"))    sgd_param_.beta_2 = toml::find<double>(section, "beta_2");
    if (section.contains("sigma"))     sgd_param_.sigma = toml::find<double>(section, "sigma");
 }
 #endif // GCTL_OPTIMIZATION_TOML
 void gctl::sgd_solver::show_solver()
 {
 	std::clog << "Solver's Setup Panel\n";
 	std::clog << "-----------------------------\n";
 	std::clog << "Solver: " << solver_name_ << "\n";
 	std::clog << "Iteration = " << sgd_param_.iteration << ", Epsilon = " << sgd_param_.epsilon << ", Mu = " << sgd_param_.mu << "\n";
 	std::clog << "Alpha = " << sgd_param_.alpha << ", Beta1 = " << sgd_param_.beta_1 << ", Beta2 = " << sgd_param_.beta_2 << ", Sigma = " << sgd_param_.sigma << "\n";
 	std::clog << "=============================\n";
 	return;
 }
 /**
  * Report a solver return code.
  *
  * With err_throw == false the message is written to ss, preceded by a colored
  * "Success"/"Fail" banner and followed by a color reset and a line break.
  * Codes of zero and above count as success, negative codes as failure.
  *
  * With err_throw == true no banner or line break is written. A negative code
  * is thrown as a std::string holding the message; a non-negative code only
  * has its message written to ss.
  */
 void gctl::sgd_solver::sgd_error_str(sgd_return_code err_code, std::ostream &ss, bool err_throw)
 {
    const bool succeeded = (err_code >= 0);
    const bool decorate = !err_throw;

    // Opening banner.
    if (decorate)
    {
 #if defined _WINDOWS || __WIN32__
        if (succeeded)
        {
            SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), FOREGROUND_INTENSITY | FOREGROUND_GREEN);
            ss << "Success! ";
        }
        else
        {
            SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), FOREGROUND_INTENSITY | FOREGROUND_RED);
            ss << "Fail! ";
        }
 #else
        ss << (succeeded ? "\033[1m\033[32mSGD Success! " : "\033[1m\033[31mSGD Fail! ");
 #endif
    }

    // Translate the code into its message.
    const char *text = "Unknown error.";
    switch (err_code)
    {
        case SGD_SUCCESS:                text = "Success."; break;
        case SGD_CONVERGENCE:            text = "The iteration reached convergence."; break;
        case SGD_STOP:                   text = "The iteration stopped by the progress evaluation function."; break;
        case SGD_UNKNOWN_ERROR:          text = "Unknown error."; break;
        case SGD_INVALID_VARIABLE_SIZE:  text = "Invalid array size."; break;
        case SGD_REACHED_MAX_ITERATIONS: text = "The maximal iteration is reached."; break;
        case SGD_INVALID_EPSILON:        text = "Invalid value for epsilon."; break;
        case SGD_INVALID_BETA:           text = "Invalid value for beta."; break;
        case SGD_INVALID_MU:             text = "Invalid value for mu."; break;
        case SGD_INVALID_ALPHA:          text = "Invalid value for alpha."; break;
        case SGD_INVALID_SIGMA:          text = "Invalid value for sigma."; break;
        case SGD_NAN_VALUE:              text = "NaN values found."; break;
        default:                         break;
    }

    // Callers catch a std::string, so the thrown object must keep that type.
    std::string err_str(text);
    if (err_throw && !succeeded) throw err_str;
    ss << err_str;

    // Closing part: restore the console color and end the line.
    if (decorate)
    {
 #if defined _WINDOWS || __WIN32__
        SetConsoleTextAttribute(GetStdHandle(STD_ERROR_HANDLE), 7);
        ss << std::endl;
 #else
        ss << "\033[0m" << std::endl;
 #endif
    }
 }
 /**
  * Return a copy of the built-in default parameter set. The parameters
  * currently held by the solver are not touched.
  */
 gctl::sgd_para gctl::sgd_solver::default_sgd_para()
 {
    return sgd_defparam;
 }
 /**
  * Run the selected solver on the model m and report the outcome.
  *
  * Silent mode: nothing is printed. Any negative return code (this includes
  * SGD_REACHED_MAX_ITERATIONS) is thrown as a std::string by sgd_error_str(),
  * regardless of verbose and err_throw.
  *
  * Otherwise the run is timed. Unless err_throw is set, the solver name and the
  * elapsed time are written to std::clog. The return code is then passed to
  * sgd_error_str() when verbose is set or the code is negative.
  *
  * @param m          Model vector, updated in place by the solver.
  * @param solver_id  Which method to run.
  * @param ss         Stream receiving the result message.
  * @param verbose    Also report non-negative return codes.
  * @param err_throw  Throw on failure instead of printing.
  *
  * Throws std::invalid_argument for an unknown solver_id.
  */
 void gctl::sgd_solver::SGD_Minimize(array<double> &m, sgd_solver_type solver_id, std::ostream &ss, bool verbose, bool err_throw)
 {
    // Single dispatch point shared by the silent and the timed path, so a new
    // solver only has to be registered once.
    auto run_solver = [&]() -> sgd_return_code
    {
        switch (solver_id)
        {
            case MOMENTUM:  solver_name_ = "MOMENTUM";  return momentum(m);
            case NAG:       solver_name_ = "NAG";       return nag(m);
            case ADAGRAD:   solver_name_ = "ADAGRAD";   return adagrad(m);
            case RMSPROP:   solver_name_ = "RMSPROP";   return rmsprop(m);
            case ADAM:      solver_name_ = "ADAM";      return adam(m);
            case NADAM:     solver_name_ = "NADAM";     return nadam(m);
            case ADAMAX:    solver_name_ = "ADAMAX";    return adamax(m);
            case ADABELIEF: solver_name_ = "ADABELIEF"; return adabelief(m);
            default: break;
        }
        throw std::invalid_argument("Invalid solver type. gctl::sgd_solver::SGD_Minimize(...)");
    };

    if (sgd_silent_)
    {
        const sgd_return_code ret = run_solver();
        if (ret < 0) sgd_error_str(ret, ss, true);
        return;
    }

    // Time the run in milliseconds: wall-clock time with OpenMP, otherwise the
    // processor time reported by clock().
 #ifdef GCTL_OPENMP
    const double start = omp_get_wtime();
    const sgd_return_code ret = run_solver();
    const double end = omp_get_wtime();
    const double costime = 1000*(end-start);
 #else
    const clock_t start = clock();
    const sgd_return_code ret = run_solver();
    const clock_t end = clock();
    const double costime = 1000*(end-start)/(double)CLOCKS_PER_SEC;
 #endif

    if (!err_throw)
    {
        // solver_name_ was set by run_solver() to the label of the method that ran.
        std::clog << std::endl;
        std::clog << "Solver: " << solver_name_ << ". Time cost: " << costime << " ms" << std::endl;
    }

    if (verbose || ret < 0) sgd_error_str(ret, ss, err_throw);
 }
 /**
  * Classic momentum method.
  *
  * Per iteration: v = mu*v + g, m = m - alpha*v, with v starting at zero.
  *
  * @param m  Model vector, updated in place.
  * @return SGD_CONVERGENCE when the objective drops below epsilon, SGD_STOP when
  *         the progress monitor returns non-zero, SGD_NAN_VALUE when an updated
  *         entry is NaN, SGD_REACHED_MAX_ITERATIONS when the iteration limit is
  *         hit, or one of the SGD_INVALID_* codes for a rejected input.
  */
 gctl::sgd_return_code gctl::sgd_solver::momentum(array<double> &m)
 {
    const int dim = m.size();

    // Input validation.
    if (dim <= 0) return SGD_INVALID_VARIABLE_SIZE;
    if (sgd_param_.epsilon < 0) return SGD_INVALID_EPSILON;
    if (sgd_param_.mu < 0 || sgd_param_.mu >= 1.0) return SGD_INVALID_MU;

    const sgd_para &p = sgd_param_;
    array<double> velocity(dim, 0.0);
    array<double> grad(dim);

    int iter = 0;
    do
    {
        const double fx = SGD_Evaluate(m, grad);
        if (SGD_Progress(fx, m, p, iter)) return SGD_STOP;
        if (fx < p.epsilon) return SGD_CONVERGENCE;

        for (int k = 0; k < dim; ++k)
        {
            velocity[k] = p.mu*velocity[k] + grad[k];
            m[k] -= p.alpha * velocity[k];
            // A NaN is the only value that differs from itself.
            if (m[k] != m[k]) return SGD_NAN_VALUE;
        }

        ++iter;
        // A non-positive iteration limit means "run until convergence".
    } while (p.iteration <= 0 || iter < p.iteration);

    return SGD_REACHED_MAX_ITERATIONS;
 }
 /**
  * Nesterov's accelerated gradient (NAG).
  *
  * The gradient is evaluated at the look-ahead point m - mu*alpha*v. The
  * momentum update v = mu*v + g, m = m - alpha*v is then applied to m itself.
  * The progress monitor receives m, not the look-ahead point.
  *
  * @param m  Model vector, updated in place.
  * @return Same set of codes as momentum().
  */
 gctl::sgd_return_code gctl::sgd_solver::nag(array<double> &m)
 {
    const int dim = m.size();

    // Input validation.
    if (dim <= 0) return SGD_INVALID_VARIABLE_SIZE;
    if (sgd_param_.epsilon < 0) return SGD_INVALID_EPSILON;
    if (sgd_param_.mu < 0 || sgd_param_.mu >= 1.0) return SGD_INVALID_MU;

    const sgd_para &p = sgd_param_;
    array<double> velocity(dim, 0.0);
    array<double> lookahead(dim);
    array<double> grad(dim);

    int iter = 0;
    do
    {
        for (int k = 0; k < dim; ++k)
        {
            lookahead[k] = m[k] - p.mu*p.alpha*velocity[k];
        }

        const double fx = SGD_Evaluate(lookahead, grad);
        if (SGD_Progress(fx, m, p, iter)) return SGD_STOP;
        if (fx < p.epsilon) return SGD_CONVERGENCE;

        for (int k = 0; k < dim; ++k)
        {
            velocity[k] = p.mu*velocity[k] + grad[k];
            m[k] -= p.alpha * velocity[k];
            if (m[k] != m[k]) return SGD_NAN_VALUE;
        }

        ++iter;
        // A non-positive iteration limit means "run until convergence".
    } while (p.iteration <= 0 || iter < p.iteration);

    return SGD_REACHED_MAX_ITERATIONS;
 }
 /**
  * AdaGrad method.
  *
  * Each entry accumulates its squared gradients, G = G + g*g, and is stepped by
  * alpha*g/(sqrt(G) + sigma).
  *
  * @param m  Model vector, updated in place.
  * @return SGD_CONVERGENCE, SGD_STOP, SGD_NAN_VALUE, SGD_REACHED_MAX_ITERATIONS,
  *         or an SGD_INVALID_* code for a rejected size, epsilon or sigma.
  */
 gctl::sgd_return_code gctl::sgd_solver::adagrad(array<double> &m)
 {
    const int dim = m.size();

    // Input validation.
    if (dim <= 0) return SGD_INVALID_VARIABLE_SIZE;
    if (sgd_param_.epsilon < 0.0) return SGD_INVALID_EPSILON;
    if (sgd_param_.sigma < 0.0) return SGD_INVALID_SIGMA;

    const sgd_para &p = sgd_param_;
    array<double> sq_sum(dim, 0.0);
    array<double> grad(dim);

    int iter = 0;
    do
    {
        const double fx = SGD_Evaluate(m, grad);
        if (SGD_Progress(fx, m, p, iter)) return SGD_STOP;
        if (fx < p.epsilon) return SGD_CONVERGENCE;

        for (int k = 0; k < dim; ++k)
        {
            sq_sum[k] += grad[k]*grad[k];
            m[k] -= p.alpha * grad[k]/(sqrt(sq_sum[k]) + p.sigma);
            if (m[k] != m[k]) return SGD_NAN_VALUE;
        }

        ++iter;
        // A non-positive iteration limit means "run until convergence".
    } while (p.iteration <= 0 || iter < p.iteration);

    return SGD_REACHED_MAX_ITERATIONS;
 }
 /**
  * RMSProp method.
  *
  * Each entry keeps a running average of its squared gradient,
  * v = beta_2*v + (1 - beta_2)*g*g, and is stepped by alpha*g/(sqrt(v) + sigma).
  * Note that beta_2 and alpha are used but not range-checked here.
  *
  * @param m  Model vector, updated in place.
  * @return SGD_CONVERGENCE, SGD_STOP, SGD_NAN_VALUE, SGD_REACHED_MAX_ITERATIONS,
  *         or an SGD_INVALID_* code for a rejected size, epsilon or sigma.
  */
 gctl::sgd_return_code gctl::sgd_solver::rmsprop(array<double> &m)
 {
    const int dim = m.size();

    // Input validation.
    if (dim <= 0) return SGD_INVALID_VARIABLE_SIZE;
    if (sgd_param_.epsilon < 0.0) return SGD_INVALID_EPSILON;
    if (sgd_param_.sigma < 0.0) return SGD_INVALID_SIGMA;

    const sgd_para &p = sgd_param_;
    array<double> sq_avg(dim, 0.0);
    array<double> grad(dim);

    int iter = 0;
    do
    {
        const double fx = SGD_Evaluate(m, grad);
        if (SGD_Progress(fx, m, p, iter)) return SGD_STOP;
        if (fx < p.epsilon) return SGD_CONVERGENCE;

        for (int k = 0; k < dim; ++k)
        {
            sq_avg[k] = p.beta_2 * sq_avg[k] + (1.0 - p.beta_2)*grad[k]*grad[k];
            m[k] -= p.alpha * grad[k]/(sqrt(sq_avg[k]) + p.sigma);
            if (m[k] != m[k]) return SGD_NAN_VALUE;
        }

        ++iter;
        // A non-positive iteration limit means "run until convergence".
    } while (p.iteration <= 0 || iter < p.iteration);

    return SGD_REACHED_MAX_ITERATIONS;
 }
 /**
  * Adam method.
  *
  * Keeps running averages of the gradient (mk) and of its square (vk). The bias
  * correction of both is folded into the step size
  * alpha_k = alpha*sqrt(1 - beta_2^t)/(1 - beta_1^t).
  *
  * The update loop may run in parallel under OpenMP. A `return` is not allowed
  * inside such a loop, so NaN detection is done through a reduction flag that
  * is inspected once the loop has finished. Unlike the serial solvers, the
  * whole vector has been updated by the time SGD_NAN_VALUE is returned.
  *
  * @param m  Model vector, updated in place.
  * @return SGD_CONVERGENCE, SGD_STOP, SGD_NAN_VALUE, SGD_REACHED_MAX_ITERATIONS,
  *         or an SGD_INVALID_* code for a rejected input.
  */
 gctl::sgd_return_code gctl::sgd_solver::adam(array<double> &m)
 {
    int n_size = m.size();
    //check parameters
    if (n_size <= 0) return SGD_INVALID_VARIABLE_SIZE;
    if (sgd_param_.epsilon < 0) return SGD_INVALID_EPSILON;
    if (sgd_param_.alpha < 0) return SGD_INVALID_ALPHA;
    if (sgd_param_.beta_1 < 0.0 || sgd_param_.beta_1 >= 1.0) return SGD_INVALID_BETA;
    if (sgd_param_.beta_2 < 0.0 || sgd_param_.beta_2 >= 1.0) return SGD_INVALID_BETA;
    if (sgd_param_.sigma < 0.0) return SGD_INVALID_SIGMA;

    array<double> mk(n_size, 0.0);
    array<double> vk(n_size, 0.0);
    array<double> g (n_size);

    // beta_1^t and beta_2^t, updated incrementally.
    double beta_1t = 1.0, beta_2t = 1.0;
    double alpha_k;

    int t = 0;
    double fx;
    while (1)
    {
        fx = SGD_Evaluate(m, g);
        if (SGD_Progress(fx, m, sgd_param_, t)) return SGD_STOP;
        if (fx < sgd_param_.epsilon) return SGD_CONVERGENCE;

        beta_1t *= sgd_param_.beta_1;
        beta_2t *= sgd_param_.beta_2;
        alpha_k = sgd_param_.alpha * sqrt(1.0 - beta_2t)/(1.0 - beta_1t);

        // Becomes non-zero as soon as any thread produces a NaN.
        int nan_found = 0;
        int i;
 #pragma omp parallel for private (i) schedule(guided) reduction(|:nan_found)
        for (i = 0; i < n_size; i++)
        {
            mk[i] = sgd_param_.beta_1*mk[i] + (1.0 - sgd_param_.beta_1)*g[i];
            vk[i] = sgd_param_.beta_2*vk[i] + (1.0 - sgd_param_.beta_2)*g[i]*g[i];
            m[i] = m[i] - alpha_k * mk[i]/(sqrt(vk[i]) + sgd_param_.sigma);
            if (m[i] != m[i]) nan_found |= 1;
        }
        if (nan_found) return SGD_NAN_VALUE;

        t++;
        if (sgd_param_.iteration > 0 && t >= sgd_param_.iteration) break;
    }

    return SGD_REACHED_MAX_ITERATIONS;
 }
 /**
  * Nadam method (Adam with a Nesterov-style look-ahead on the momentum term).
  *
  * Per entry and iteration t (starting at 1):
  *   g_hat = g/(1 - beta_1^t)
  *   mk    = beta_1*mk + (1 - beta_1)*g,      mk_hat = mk/(1 - beta_1^(t+1))
  *   nk    = beta_2*nk + (1 - beta_2)*g*g,    nk_hat = nk/(1 - beta_2^t)
  *   m     = m - alpha*((1 - beta_1^t)*g_hat + beta_1^(t+1)*mk_hat)/(sqrt(nk_hat) + sigma)
  *
  * NOTE(review): the two weights in the last line are the powers beta_1^t and
  * beta_1^(t+1). Published formulations with a constant decay rate weight the
  * terms with (1 - beta_1) and beta_1 instead -- confirm that the powers are
  * intended.
  *
  * @param m  Model vector, updated in place.
  * @return SGD_CONVERGENCE, SGD_STOP, SGD_NAN_VALUE, SGD_REACHED_MAX_ITERATIONS,
  *         or an SGD_INVALID_* code for a rejected input.
  */
 gctl::sgd_return_code gctl::sgd_solver::nadam(array<double> &m)
 {
    const int dim = m.size();

    // Input validation.
    if (dim <= 0) return SGD_INVALID_VARIABLE_SIZE;
    if (sgd_param_.epsilon < 0) return SGD_INVALID_EPSILON;
    if (sgd_param_.alpha < 0) return SGD_INVALID_ALPHA;
    if (sgd_param_.beta_1 < 0.0 || sgd_param_.beta_1 >= 1.0) return SGD_INVALID_BETA;
    if (sgd_param_.beta_2 < 0.0 || sgd_param_.beta_2 >= 1.0) return SGD_INVALID_BETA;
    if (sgd_param_.sigma < 0.0) return SGD_INVALID_SIGMA;

    const sgd_para &p = sgd_param_;
    array<double> mk(dim, 0.0);
    array<double> nk(dim, 0.0);
    array<double> grad(dim);

    // Running powers: beta_1^t, beta_1^(t+1) and beta_2^t.
    double pow_b1 = 1.0, pow_b1_next = p.beta_1, pow_b2 = 1.0;

    int iter = 0;
    do
    {
        const double fx = SGD_Evaluate(m, grad);
        if (SGD_Progress(fx, m, p, iter)) return SGD_STOP;
        if (fx < p.epsilon) return SGD_CONVERGENCE;

        pow_b1      *= p.beta_1;
        pow_b1_next *= p.beta_1;
        pow_b2      *= p.beta_2;

        for (int k = 0; k < dim; ++k)
        {
            // The bias-corrected values are only needed for this entry, so plain
            // scalars are enough.
            const double g_hat = grad[k]/(1.0 - pow_b1);
            mk[k] = p.beta_1*mk[k] + (1.0 - p.beta_1)*grad[k];
            nk[k] = p.beta_2*nk[k] + (1.0 - p.beta_2)*grad[k]*grad[k];
            const double mk_hat = mk[k]/(1.0 - pow_b1_next);
            const double nk_hat = nk[k]/(1.0 - pow_b2);

            m[k] -= p.alpha * ((1.0 - pow_b1)*g_hat
                + pow_b1_next*mk_hat)/(sqrt(nk_hat) + p.sigma);
            if (m[k] != m[k]) return SGD_NAN_VALUE;
        }

        ++iter;
        // A non-positive iteration limit means "run until convergence".
    } while (p.iteration <= 0 || iter < p.iteration);

    return SGD_REACHED_MAX_ITERATIONS;
 }
 /**
  * AdaMax method (the infinity-norm variant of Adam).
  *
  * Per entry: mk = beta_1*mk + (1 - beta_1)*g, vk = max(beta_2*vk, |g|) and
  * m = m - alpha*mk/((1 - beta_1^t)*vk + sigma).
  *
  * sigma guards the division: an entry whose gradient has been zero since the
  * first iteration has mk == 0 and vk == 0, which without the guard evaluates
  * 0/0 and aborts the run with SGD_NAN_VALUE. With sigma == 0 the unguarded
  * behavior is retained.
  *
  * @param m  Model vector, updated in place.
  * @return SGD_CONVERGENCE, SGD_STOP, SGD_NAN_VALUE, SGD_REACHED_MAX_ITERATIONS,
  *         or an SGD_INVALID_* code for a rejected input.
  */
 gctl::sgd_return_code gctl::sgd_solver::adamax(array<double> &m)
 {
    int n_size = m.size();
    //check parameters
    if (n_size <= 0) return SGD_INVALID_VARIABLE_SIZE;
    if (sgd_param_.epsilon < 0) return SGD_INVALID_EPSILON;
    if (sgd_param_.alpha < 0) return SGD_INVALID_ALPHA;
    if (sgd_param_.beta_1 < 0.0 || sgd_param_.beta_1 >= 1.0) return SGD_INVALID_BETA;
    if (sgd_param_.beta_2 < 0.0 || sgd_param_.beta_2 >= 1.0) return SGD_INVALID_BETA;
    if (sgd_param_.sigma < 0.0) return SGD_INVALID_SIGMA;

    array<double> mk(n_size, 0.0);
    array<double> vk(n_size, 0.0);
    array<double> g (n_size);

    // beta_1^t, updated incrementally.
    double beta_1t = 1.0;

    int t = 0;
    double fx;
    while (1)
    {
        fx = SGD_Evaluate(m, g);
        if (SGD_Progress(fx, m, sgd_param_, t)) return SGD_STOP;
        if (fx < sgd_param_.epsilon) return SGD_CONVERGENCE;

        beta_1t *= sgd_param_.beta_1;

        for (int i = 0; i < n_size; i++)
        {
            mk[i] = sgd_param_.beta_1*mk[i] + (1.0 - sgd_param_.beta_1)*g[i];
            vk[i] = std::max(sgd_param_.beta_2*vk[i], std::fabs(g[i]));
            m[i] = m[i] - sgd_param_.alpha * mk[i]/((1.0 - beta_1t)*vk[i] + sgd_param_.sigma);
            if (m[i] != m[i]) return SGD_NAN_VALUE;
        }

        t++;
        if (sgd_param_.iteration > 0 && t >= sgd_param_.iteration) break;
    }

    return SGD_REACHED_MAX_ITERATIONS;
 }
 /**
  * AdaBelief method.
  *
  * Same structure as adam(), except that the second running average tracks the
  * squared deviation of the gradient from its running mean, (g - mk)^2, instead
  * of g^2. The bias correction is folded into the step size
  * alpha*sqrt(1 - beta_2^t)/(1 - beta_1^t).
  *
  * @param m  Model vector, updated in place.
  * @return SGD_CONVERGENCE, SGD_STOP, SGD_NAN_VALUE, SGD_REACHED_MAX_ITERATIONS,
  *         or an SGD_INVALID_* code for a rejected input.
  */
 gctl::sgd_return_code gctl::sgd_solver::adabelief(array<double> &m)
 {
    const int dim = m.size();

    // Input validation.
    if (dim <= 0) return SGD_INVALID_VARIABLE_SIZE;
    if (sgd_param_.epsilon < 0) return SGD_INVALID_EPSILON;
    if (sgd_param_.alpha < 0) return SGD_INVALID_ALPHA;
    if (sgd_param_.beta_1 < 0.0 || sgd_param_.beta_1 >= 1.0) return SGD_INVALID_BETA;
    if (sgd_param_.beta_2 < 0.0 || sgd_param_.beta_2 >= 1.0) return SGD_INVALID_BETA;
    if (sgd_param_.sigma < 0.0) return SGD_INVALID_SIGMA;

    const sgd_para &p = sgd_param_;
    array<double> mean(dim, 0.0);
    array<double> belief(dim, 0.0);
    array<double> grad(dim);

    // Running powers beta_1^t and beta_2^t.
    double pow_b1 = 1.0, pow_b2 = 1.0;

    int iter = 0;
    do
    {
        const double fx = SGD_Evaluate(m, grad);
        if (SGD_Progress(fx, m, p, iter)) return SGD_STOP;
        if (fx < p.epsilon) return SGD_CONVERGENCE;

        pow_b1 *= p.beta_1;
        pow_b2 *= p.beta_2;
        const double step = p.alpha * sqrt(1.0 - pow_b2)/(1.0 - pow_b1);

        for (int k = 0; k < dim; ++k)
        {
            mean[k] = p.beta_1*mean[k] + (1.0 - p.beta_1)*grad[k];
            // The deviation uses the mean that was just updated.
            belief[k] = p.beta_2*belief[k] + (1.0 - p.beta_2)*(grad[k] - mean[k])*(grad[k] - mean[k]);
            m[k] -= step * mean[k]/(sqrt(belief[k]) + p.sigma);
            if (m[k] != m[k]) return SGD_NAN_VALUE;
        }

        ++iter;
        // A non-positive iteration limit means "run until convergence".
    } while (p.iteration <= 0 || iter < p.iteration);

    return SGD_REACHED_MAX_ITERATIONS;
 }
--- a/lib/optimization/sgd.h
+++ b/lib/optimization/sgd.h
@ -0,0 +1,201 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_SGD_H
 #define _GCTL_SGD_H
 #include "gctl/core.h"
 #include "gctl/algorithm.h"
 #include "gctl_optimization_config.h"
 #ifdef GCTL_OPTIMIZATION_TOML
 #include "toml.hpp"
 #endif // GCTL_OPTIMIZATION_TOML
 #if defined _WINDOWS || __WIN32__
 #include "windows.h"
 #endif // _WINDOWS || __WIN32__
 #ifdef GSTL_OPENMP
 #include "omp.h"
 #endif // GSTL_OPENMP
 namespace gctl
 {
    /**
     * @brief      Methods that can be selected through sgd_solver::SGD_Minimize().
     *             Each enumerator maps to the member function of the same
     *             (lower-case) name.
     */
    enum sgd_solver_type
    {
        /**
         * Classic momentum.
         */
        MOMENTUM,
        /**
         * Nesterov's accelerated gradient (NAG)
         */
        NAG,
        /**
         * AdaGrad method.
         */
        ADAGRAD,
        /**
         * RMSProp method.
         */
        RMSPROP,
        /**
         * Adam method. This is the default of SGD_Minimize().
         */
        ADAM,
        /**
         * Nadam method.
         */
        NADAM,
        /**
         * AdaMax method.
         */
        ADAMAX,
        /**
         * AdaBelief method.
         */
        ADABELIEF,
    };
    /**
     * @brief      Return values of the solver functions of sgd_solver.
     *
     * Values of zero and above are reported as success by
     * sgd_solver::sgd_error_str(), negative values as failure. The enumerators
     * after SGD_UNKNOWN_ERROR continue counting from -1024, so all of them are
     * negative. Note that this includes SGD_REACHED_MAX_ITERATIONS.
     */
    enum sgd_return_code
    {
        SGD_SUCCESS = 0, ///< The optimization terminated successfully.
        SGD_CONVERGENCE = 1, ///< The optimization reached convergence.
        SGD_STOP, ///< The process stopped by the monitoring function.
        SGD_UNKNOWN_ERROR = -1024, ///< Unknown error.
        SGD_INVALID_VARIABLE_SIZE, ///< The variable size is zero or negative.
        SGD_INVALID_EPSILON, ///< The epsilon is negative.
        SGD_REACHED_MAX_ITERATIONS, ///< Iteration reached max limit.
        SGD_INVALID_MU, ///< Invalid value for mu.
        SGD_INVALID_ALPHA, ///< Invalid value for alpha.
        SGD_INVALID_BETA, ///< Invalid value for beta_1 or beta_2.
        SGD_INVALID_SIGMA, ///< Invalid value for sigma.
        SGD_NAN_VALUE, ///< A NaN value was found in the model.
    };
    /**
     * @brief    Parameters of the SGD methods.
     *
     * The member order matters: the default set in sgd.cpp is written as an
     * aggregate initializer that follows it.
     */
    struct sgd_para
    {
        /**
         * Maximal iteration times. The iteration won't stop unless the convergence 
         * is reached if this parameter is equal to or smaller than zero. The default 
         * is 0.
         */
        int iteration;
        /**
         * Epsilon for the convergence test. A solver reports convergence once the
         * objective value is smaller than epsilon. Negative values are rejected by
         * the solvers; zero is accepted. The default is 1e-6.
         */
        double epsilon;
        /**
         * Damping rate of the classic momentum method and the NAG method. Both
         * solvers require a value in [0, 1). The default is 0.01.
         */
        double mu;
        /**
         * Step size of the iteration, used by all methods. The default value is
         * 0.01. Negative values are rejected by Adam, Nadam, AdaMax and AdaBelief.
         */
        double alpha;
        /**
         * Exponential decay rates for the first order moment estimates. The range of this 
         * parameter is [0, 1) and the default value is 0.9.
         */
        double beta_1;
        /**
         * Exponential decay rates for the second order moment estimates. The range of this 
         * parameter is [0, 1) and the default value is 0.999.
         */
        double beta_2;
        /**
         * A small non-negative number added to the denominator of the update to
         * avoid a division by zero. The default value is 1e-8.
         */
        double sigma;
    };
    /**
     * @brief    Abstract base class of the stochastic gradient descent solvers.
     *
     * A derived class implements SGD_Evaluate() to supply the objective value
     * and its gradient, and then calls SGD_Minimize() (or one of the solver
     * functions directly) to update a model vector in place.
     */
    class sgd_solver
    {
    private:
        sgd_para sgd_param_; // Parameters used by the solvers
        int sgd_inter_; // Report interval (in iterations) of the default SGD_Progress()
        bool sgd_silent_; // True once sgd_silent() has been called
        std::string solver_name_; // Name of the method selected by the last SGD_Minimize() call
    public:
        sgd_solver();
        virtual ~sgd_solver();
        /// Return the objective value at x and store its gradient in g. Must be implemented by the derived class.
        virtual double SGD_Evaluate(const array<double> &x, array<double> &g) = 0;
        /// Progress monitor called once per iteration; a non-zero return value stops the solver with SGD_STOP.
        virtual int SGD_Progress(double fx, const array<double> &x, const sgd_para &param, const int k);
        /// Suppress the console output of the default monitor and of SGD_Minimize().
        void sgd_silent();
        /// Set the report interval of the default progress monitor.
        void set_sgd_report_interval(int inter);
        /// Replace the parameter set. The values are checked by the solvers, not here.
        void set_sgd_para(const sgd_para &param);
        /// Print the solver name and the current parameters to std::clog.
        void show_solver();
        /// Write the message of a return code to ss, or throw it as a std::string if err_throw is set and the code is negative.
        void sgd_error_str(sgd_return_code err_code, std::ostream &ss = std::clog, bool err_throw = false);
        /// Return a copy of the built-in default parameters.
        sgd_para default_sgd_para();
 #ifdef GCTL_OPTIMIZATION_TOML
        /// Reset to the defaults, then read the parameters from the [sgd] table of a TOML document.
        void set_sgd_para(const toml::value &toml_data);
 #endif // GCTL_OPTIMIZATION_TOML
        // The individual methods. Each one updates m in place and returns a sgd_return_code.
        sgd_return_code momentum(array<double> &m);
        sgd_return_code nag(array<double> &m);
        sgd_return_code adagrad(array<double> &m);
        sgd_return_code rmsprop(array<double> &m);
        sgd_return_code adam(array<double> &m);
        sgd_return_code nadam(array<double> &m);
        sgd_return_code adamax(array<double> &m);
        sgd_return_code adabelief(array<double> &m);
        /// Run the method selected by solver_id on m and report the result to ss.
        void SGD_Minimize(array<double> &m, sgd_solver_type solver_id = ADAM, std::ostream &ss = std::clog, bool verbose = true, bool err_throw = false);
    };
 }
 #endif // _GCTL_SGD_H
--- a/lib/optimization/svd.cpp
+++ b/lib/optimization/svd.cpp
@ -0,0 +1,184 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #include "svd.h"
 /**
  * @brief      Default constructor. Brings the object into its default state by calling reset().
  */
 gctl::svd::svd()
 {
    this->reset();
 }
 /**
  * @brief      Constructs the object and decomposes a matrix right away.
  *
  * Delegates to the default constructor first, then calls decompose() on the input.
  *
  * @param[in]  src_mat  The matrix to decompose.
  */
 gctl::svd::svd(const matrix<double> &src_mat) : svd()
 {
    this->decompose(src_mat);
 }
 /**
  * @brief      Restores the default set-ups and discards any stored decomposition.
  *
  * Defaults: at most 1000 iterations, a tolerance of 1e-8, and K = 0
  * (decompose() replaces a zero K with the column number of its input).
  */
 void gctl::svd::reset()
 {
    // Throw away the results of a previous decomposition.
    S.clear();
    V.clear();
    U.clear();

    // Put the control parameters back to their defaults.
    epsilon = 1e-8;
    K = 0;
    maxi_iteration = 1000;
 }
 /**
  * @brief      Sets the number of singular values (and vectors) to compute.
  *
  * @param[in]  k     Requested number; must be positive, otherwise invalid_argument is thrown.
  */
 void gctl::svd::set_singular_number(int k)
 {
    if (k > 0)
    {
        K = k;
        return;
    }

    // Zero and negative requests are rejected.
    throw invalid_argument("Invalid singular number. From gctl::svd::set_singular_number(...)");
 }
 /**
  * @brief      Sets the maximal number of iterations used for each singular component.
  *
  * @param[in]  t     Maximal iteration count; must be positive, otherwise
  *                   invalid_argument is thrown.
  */
 void gctl::svd::set_iteration(int t)
 {
    if (t <= 0)
    {
        // The message names the offending quantity (it used to say "singular number",
        // copied from set_singular_number()).
        throw invalid_argument("Invalid iteration number. From gctl::svd::set_iteration(...)");
    }
    maxi_iteration = t;
    return;
 }
 /**
  * @brief      Sets the tolerance used by decompose().
  *
  * decompose() compares both the convergence measure and the vector norms against
  * this value.
  *
  * @param[in]  e     Tolerance; must be a positive number. Zero, negative values and
  *                   NaN are rejected with invalid_argument.
  */
 void gctl::svd::set_epsilon(double e)
 {
    // Written as !(e > 0) rather than (e <= 0) so that NaN is rejected as well: every
    // comparison with NaN is false, so a NaN tolerance would otherwise slip through and
    // make decompose() skip its iterations.
    if (!(e > 0.0))
    {
        // The message names the offending quantity (it used to say "singular number",
        // copied from set_singular_number()).
        throw invalid_argument("Invalid epsilon. From gctl::svd::set_epsilon(...)");
    }
    epsilon = e;
    return;
 }
 /**
  * @brief      Computes the leading K singular triplets of a matrix, one at a time.
  *
  * For every component a random start vector is refined by alternately multiplying
  * with the transposed matrix and the matrix itself, while the directions that were
  * already found are passed to orth() in each step. Results are written to the
  * public members: S[col] holds the singular value, row col of U the left vector
  * (length M) and row col of V the right vector (length N).
  *
  * The routine stops early as soon as a component's value drops below epsilon; the
  * remaining entries of S, U and V then keep the 0.0 they were resized with.
  *
  * NOTE(review): normalize() is assumed to scale the vector to unit length and return
  * its former norm, and orth(a, b) is assumed to remove the component along a from
  * b -- both are declared outside this file; confirm.
  *
  * @param[in]  src_mat  The M*N matrix to decompose.
  */
 void gctl::svd::decompose(const matrix<double> &src_mat)
 {
    int M = src_mat.row_size();
    int N = src_mat.col_size();
    // K == 0 means "not set": fall back to the column number. K is a member, so the
    // value chosen here stays in place for later calls until reset() or
    // set_singular_number() changes it.
    if (K == 0) K = N;
    // Results are stored row-wise: U is K*M and V is K*N, all initialized with 0.0.
    S.resize(K, 0.0);
    U.resize(K, M, 0.0);
    V.resize(K, N, 0.0);
    // Re-seeds the global C random number generator on every call.
    srand(time(0));
    array<double> left_vector(M), next_left_vector(M);
    array<double> right_vector(N), next_right_vector(N);
    array<double> U_tmp(M), V_tmp(N);
    double diff, r, d;
    for(int col=0;col<K;col++)
    {
        // diff starts above the tolerance so that the iteration is entered; r = -1
        // marks "no value computed yet".
        diff = 1;
        r = -1;
        // Draw a random start vector with entries in [0, 1]; repeat until normalize()
        // reports a value above epsilon.
        while(1)
        {
            for(int i=0;i<M;i++)
                left_vector[i]= (double) rand() / RAND_MAX;
            if(normalize(left_vector, epsilon) > epsilon)
                break;
        }
        // Iterate until successive left vectors agree (diff < epsilon) or the
        // iteration limit is reached.
        for(int iter=0; diff >= epsilon && iter < maxi_iteration; iter++)
        {
            next_left_vector.assign_all(0.0);
            next_right_vector.assign_all(0.0);
            // next_right_vector = src_mat^T * left_vector
            for(int i=0;i<M;i++)
                for(int j=0;j<N;j++)
                    next_right_vector[j]+=left_vector[i]*src_mat[i][j];
            r=normalize(next_right_vector, epsilon);
            // Nothing is left in this direction: leave the iteration with r < epsilon.
            if(r<epsilon) break;
            // Pass every right vector found so far (rows 0..col-1 of V) to orth()
            // together with the new candidate, then normalize it again.
            for(int i=0;i<col;i++)
            {
                for (int j = 0; j < N; j++)
                {
                    V_tmp[j] = V[i][j];
                }
                orth(V_tmp, next_right_vector);
            }
            normalize(next_right_vector, epsilon);
            // next_left_vector = src_mat * next_right_vector
            for(int i=0;i<M;i++)
                for(int j=0;j<N;j++)
                    next_left_vector[i]+=next_right_vector[j]*src_mat[i][j];
            // The value returned here is what ends up in S[col] if the loop finishes
            // with this iteration.
            r=normalize(next_left_vector, epsilon);
            if(r<epsilon) break;
            // Same treatment for the left vector, using rows 0..col-1 of U.
            for(int i=0;i<col;i++)
            {
                for (int j = 0; j < M; j++)
                {
                    U_tmp[j] = U[i][j];
                }
                orth(U_tmp, next_left_vector);
            }
            normalize(next_left_vector, epsilon);
            // Convergence measure: squared Euclidean distance between the new and the
            // previous left vector (no square root is taken).
            diff=0;
            for(int i=0;i<M;i++)
            {
                d=next_left_vector[i]-left_vector[i];
                diff+=d*d;
            }
            // Accept the new pair as the current estimate.
            for (int i = 0; i < M; i++)
            {
                left_vector[i] = next_left_vector[i];
            }
            for (int i = 0; i < N; i++)
            {
                right_vector[i] = next_right_vector[i];
            }
        }
        if(r>=epsilon)
        {
            // Store the component that was found.
            S[col]=r;
            for (int i = 0; i < M; i++)
            {
                U[col][i] = left_vector[i];
            }
            for (int i = 0; i < N; i++)
            {
                V[col][i] = right_vector[i];
            }
        }
        // The value fell below the tolerance (or was never computed): stop looking
        // for further components.
        else break;
    }
    return;
 }
--- a/lib/optimization/svd.h
+++ b/lib/optimization/svd.h
@ -0,0 +1,71 @@
 /********************************************************
 *  ██████╗  ██████╗████████╗██╗
 * ██╔════╝ ██╔════╝╚══██╔══╝██║
 * ██║  ███╗██║        ██║   ██║
 * ██║   ██║██║        ██║   ██║
 * ╚██████╔╝╚██████╗   ██║   ███████╗
 *  ╚═════╝  ╚═════╝   ╚═╝   ╚══════╝
 * Geophysical Computational Tools & Library (GCTL)
 *
 * Copyright (c) 2022  Yi Zhang (yizhang-geo@zju.edu.cn)
 *
 * GCTL is distributed under a dual licensing scheme. You can redistribute 
 * it and/or modify it under the terms of the GNU Lesser General Public 
 * License as published by the Free Software Foundation, either version 2 
 * of the License, or (at your option) any later version. You should have 
 * received a copy of the GNU Lesser General Public License along with this 
 * program. If not, see <http://www.gnu.org/licenses/>.
 * 
 * If the terms and conditions of the LGPL v.2. would prevent you from using 
 * the GCTL, please consider the option to obtain a commercial license for a 
 * fee. These licenses are offered by the GCTL's original author. As a rule, 
 * licenses are provided "as-is", unlimited in time for a one time fee. Please 
 * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget 
 * to include some description of your company and the realm of its activities. 
 * Also add information on how to contact you by electronic and paper mail.
 ******************************************************/
 #ifndef _GCTL_SVD_H
 #define _GCTL_SVD_H
 #include "gctl/core.h"
 #include "gctl/algorithm.h"
 namespace gctl
 {
    /**
     * @brief      Singular value decomposition (SVD).
     * 
     * A = U^T \cdot S \cdot V
     * A     the input two-dimensional array of size M*N
     * K     the number of singular values and singular vectors to compute
     * U     the U matrix of the decomposition, of size K*M
     * S     the diagonal S matrix of the decomposition, stored as a vector that
     *       holds the first K singular values, of size 1*K
     * V     the V matrix of the decomposition, of size K*N
     *
     */
    class svd
    {
    public:
        // Results of the decomposition, filled by decompose(). The singular vectors
        // are stored row-wise: U is K*M and V is K*N.
        matrix<double> U, V;
        // The singular values (K entries).
        array<double> S;

        // Creates an object with the default set-ups (see reset()).
        svd();
        // Creates an object with the default set-ups and decomposes src_mat right away.
        svd(const matrix<double> &src_mat);
        virtual ~svd(){}

        // Restores the default set-ups (1000 iterations, K = 0, epsilon = 1e-8) and
        // clears U, V and S.
        void reset();
        // Sets the number of singular values to compute. Throws invalid_argument if k <= 0.
        void set_singular_number(int k);
        // Sets the maximal number of iterations per singular value. Throws
        // invalid_argument if t <= 0.
        void set_iteration(int t);
        // Sets the tolerance used by decompose(). Throws invalid_argument if e <= 0.
        void set_epsilon(double e);
        // Returns the number of singular values K. The accessor does not modify the
        // object, so it is const-qualified and may be called on const instances.
        int get_singular_number() const {return K;}
        // Decomposes src_mat and stores the results in U, S and V. If K is still zero
        // it is set to the column number of src_mat first.
        void decompose(const matrix<double> &src_mat);
    protected:
        // Maximal iterations per singular value, and the number of singular values to
        // compute (0 = not set).
        int maxi_iteration, K;
        // Tolerance used by decompose() for both convergence and vanishing norms.
        double epsilon;
    };
 }
 #endif // _GCTL_SVD_H