Cholesky分解法又叫平方根法,是求解对称正定线性方程组最常用的方法之一。对于一般矩阵,为了消除LU分
解的局限性和误差的过分积累,采用了选主元的方法,但对于对称正定矩阵而言,选主元是不必要的。
定理:若
对称正定,则存在一个对角元为正数的下三角矩阵
,使得
成立。
假设现在要求解线性方程组
,其中
为对称正定矩阵,那么
可通过下面步骤求解
(1)求
的Cholesky分解,得到data:image/s3,"s3://crabby-images/9e9d3/9e9d3d6d4dbb8e037f366f2d49c17c11edc5777b" alt=""
(2)求解
,得到data:image/s3,"s3://crabby-images/67a84/67a84c046fff9d0c45dd3b4f30952ea29d50bb47" alt=""
(3)求解
,得到data:image/s3,"s3://crabby-images/c6607/c6607e09e6e82f33e1ef2c9716effba0e50eefb0" alt=""
现在的关键问题是对
进行Cholesky分解。假设
data:image/s3,"s3://crabby-images/e960f/e960f34dc8a849a9cdd68adcb79d7b36a48be646" alt="Cholesky分解法_第1张图片"
通过
比较两边的关系,首先由
,再由
data:image/s3,"s3://crabby-images/950cc/950cc6944e2439fe19d8b26637249fec6394ae66" alt=""
这样便得到了矩阵
的第一列元素,假定已经算出了
的前
列元素,通过
data:image/s3,"s3://crabby-images/ab55f/ab55fbe5d4dbfe573f08f608ccfc6010f262820e" alt=""
可以得到
data:image/s3,"s3://crabby-images/4c7ad/4c7ad82361ac6b9dac5d172215f2b30c0eed4648" alt=""
进一步再由
data:image/s3,"s3://crabby-images/96d0f/96d0f7a9c012420e8a9045fd97b12f4fa784f444" alt=""
最终得到
data:image/s3,"s3://crabby-images/36a2f/36a2f7d5971c6ef9d44fc0907ab088d7ad60cbf5" alt=""
这样便通过
的前
列求出了第
列,一直递推下去即可求出
,这种方法称为平方根法。
代码:
- #include <iostream>
- #include <string.h>
- #include <stdio.h>
- #include <vector>
- #include <math.h>
-
- using namespace std;
- const int N = 1005;
- typedef double Type;
-
- Type A[N][N], L[N][N];
-
-
- void Cholesky(Type A[][N], Type L[][N], int n)
- {
- for(int k = 0; k < n; k++)
- {
- Type sum = 0;
- for(int i = 0; i < k; i++)
- sum += L[k][i] * L[k][i];
- sum = A[k][k] - sum;
- L[k][k] = sqrt(sum > 0 ? sum : 0);
- for(int i = k + 1; i < n; i++)
- {
- sum = 0;
- for(int j = 0; j < k; j++)
- sum += L[i][j] * L[k][j];
- L[i][k] = (A[i][k] - sum) / L[k][k];
- }
- for(int j = 0; j < k; j++)
- L[j][k] = 0;
- }
- }
-
-
- vector<Type> Solve(Type L[][N], vector<Type> X, int n)
- {
-
- for(int k = 0; k < n; k++)
- {
- for(int i = 0; i < k; i++)
- X[k] -= X[i] * L[k][i];
- X[k] /= L[k][k];
- }
-
- for(int k = n - 1; k >= 0; k--)
- {
- for(int i = k + 1; i < n; i++)
- X[k] -= X[i] * L[i][k];
- X[k] /= L[k][k];
- }
- return X;
- }
-
- void Print(Type L[][N], const vector<Type> B, int n)
- {
- for(int i = 0; i < n; i++)
- {
- for(int j = 0; j < n; j++)
- cout<<L[i][j]<<" ";
- cout<<endl;
- }
- cout<<endl;
- vector<Type> X = Solve(L, B, n);
- vector<Type>::iterator it;
- for(it = X.begin(); it != X.end(); it++)
- cout<<*it<<" ";
- cout<<endl;
- }
-
- int main()
- {
- int n;
- cin>>n;
- memset(L, 0, sizeof(L));
- for(int i = 0; i < n; i++)
- {
- for(int j = 0; j < n; j++)
- cin>>A[i][j];
- }
- vector<Type> B;
- for(int i = 0; i < n; i++)
- {
- Type y;
- cin>>y;
- B.push_back(y);
- }
- Cholesky(A, L, n);
- Print(L, B, n);
- return 0;
- }
-
-
-
-
-
-
-
-
-
用上述的方法需要进行开方,这有可能损失精度和增加运算量,为了避免开方,Cholesky分解有个改进的版本。
将对称正定矩阵
通过分解成
,其中
是单位下三角矩阵,
是对角均为正数的对角矩阵。把这
一分解叫做
分解,是Cholesky分解的变形。对应两边的元素,很容易得到
data:image/s3,"s3://crabby-images/57451/57451319f2f7f05205ec801f3e81398601bffcb0" alt=""
由此可以确定计算
和
的公式如下
data:image/s3,"s3://crabby-images/f2136/f213618e6492b04c6b2e1a0e65ad9f024a9d1ab3" alt="Cholesky分解法_第2张图片"
在实际计算时,是将
的严格下三角元素存储在
的对应位置上,而将
的对角元存储在
的对应的对角位置上。
类似地求解线性方程组
的解步骤如下
(1)对矩阵
进行分解得到data:image/s3,"s3://crabby-images/13bba/13bba7cc86291d38f78b1baacd4c0f8fda3a487d" alt=""
(2)求解
,得到data:image/s3,"s3://crabby-images/dfd43/dfd43e9e2575568811d9cc052ca60212aced0b73" alt=""
(3)求解
,得到data:image/s3,"s3://crabby-images/0c27d/0c27d92837cbff2490da12c218a6b6c295d71267" alt=""
代码:
- #include <iostream>
- #include <string.h>
- #include <stdio.h>
- #include <vector>
- #include <math.h>
-
- using namespace std;
- const int N = 1005;
- typedef double Type;
-
- Type A[N][N], L[N][N], D[N][N];
-
-
- void Cholesky(Type A[][N], Type L[][N], Type D[][N], int n)
- {
- for(int k = 0; k < n; k++)
- {
- for(int i = 0; i < k; i++)
- A[k][k] -= A[i][i] * A[k][i] * A[k][i];
- for(int j = k + 1; j < n; j++)
- {
- for(int i = 0; i < k; i++)
- A[j][k] -= A[j][i] * A[i][i] * A[k][i];
- A[j][k] /= A[k][k];
- }
- }
- memset(L, 0, sizeof(L));
- memset(D, 0, sizeof(D));
- for(int i = 0; i < n; i++)
- {
- D[i][i] = A[i][i];
- L[i][i] = 1;
- }
- for(int i = 0; i < n; i++)
- {
- for(int j = 0; j < i; j++)
- L[i][j] = A[i][j];
- }
- }
-
- void Transposition(Type L[][N], int n)
- {
- for(int i = 0; i < n; i++)
- {
- for(int j = 0; j < i; j++)
- swap(L[i][j], L[j][i]);
- }
- }
-
- void Multi(Type A[][N], Type B[][N], int n)
- {
- Type **C = new Type*[n];
- for(int i = 0; i < n; i++)
- C[i] = new Type[n];
- for(int i = 0; i < n; i++)
- {
- for(int j = 0; j < n; j++)
- {
- C[i][j] = 0;
- for(int k = 0; k < n; k++)
- C[i][j] += A[i][k] * B[k][j];
- }
- }
- for(int i = 0; i < n; i++)
- {
- for(int j = 0; j < n; j++)
- B[i][j] = C[i][j];
- }
- for(int i = 0; i < n; i++)
- {
- delete[] C[i];
- C[i] = NULL;
- }
- delete C;
- C = NULL;
- }
-
-
- vector<Type> Solve(Type L[][N], Type D[][N], vector<Type> X, int n)
- {
-
- for(int k = 0; k < n; k++)
- {
- for(int i = 0; i < k; i++)
- X[k] -= X[i] * L[k][i];
- X[k] /= L[k][k];
- }
-
- Transposition(L, n);
- Multi(D, L, n);
- for(int k = n - 1; k >= 0; k--)
- {
- for(int i = k + 1; i < n; i++)
- X[k] -= X[i] * L[k][i];
- X[k] /= L[k][k];
- }
- return X;
- }
-
- void Print(Type L[][N], Type D[][N], const vector<Type> B, int n)
- {
- for(int i = 0; i < n; i++)
- {
- for(int j = 0; j < n; j++)
- cout<<L[i][j]<<" ";
- cout<<endl;
- }
- cout<<endl;
- vector<Type> X = Solve(L, D, B, n);
- vector<Type>::iterator it;
- for(it = X.begin(); it != X.end(); it++)
- cout<<*it<<" ";
- cout<<endl;
- }
-
- int main()
- {
- int n;
- cin>>n;
- memset(L, 0, sizeof(L));
- for(int i = 0; i < n; i++)
- {
- for(int j = 0; j < n; j++)
- cin>>A[i][j];
- }
- vector<Type> B;
- for(int i = 0; i < n; i++)
- {
- Type y;
- cin>>y;
- B.push_back(y);
- }
- Cholesky(A, L, D, n);
- Print(L, D, B, n);
- return 0;
- }
-
-
-
-
-
-
-
-
-
参考资料:http://class.htu.cn/nla/cha1/sect3.htm