第十一课.高斯过程_tzc_fly的博客

相关文章推荐

文武双全的书包 · 机器学习技术：高斯过程初探- 开发者头条· 1 年前 ·

文武双全的书包 · 万字总结复杂而奇妙的高斯过程！_Sim148 ...· 1 年前 ·

文武双全的书包 · 7 布朗运动| 应用随机过程· 1 年前 ·

文武双全的书包 · 第十一课.高斯过程_tzc_fly的博客-C ...· 1 年前 ·

文武双全的书包 · 高斯过程_百度百科· 1 年前 ·

def gaussian_kernel(x1, x2, l=1.0, sigma_f=1.0):
    """Return the RBF (squared-exponential) kernel matrix between x1 and x2.

    k(a, b) = sigma_f**2 * exp(-||a - b||**2 / (2 * l**2))

    Args:
        x1: array-like whose first axis indexes the m input points; it may be
            1-D (scalar points) or 2-D (one row per point).
        x2: array-like whose first axis indexes the n input points.
        l: length scale of the kernel.
        sigma_f: signal standard deviation (the output scale is sigma_f**2).

    Returns:
        An (m, n) float array with entry [i, j] = k(x1[i], x2[j]).
    """
    a = np.asarray(x1, dtype=float)
    b = np.asarray(x2, dtype=float)
    # Flatten everything after the first axis so scalar points (1-D input)
    # and vector points (2-D input) go through the same code path.
    a = a.reshape(a.shape[0], int(np.prod(a.shape[1:])))
    b = b.reshape(b.shape[0], int(np.prod(b.shape[1:])))
    # Pairwise squared Euclidean distances via broadcasting: (m, 1, d) - (1, n, d).
    dist_matrix = np.sum((a[:, None, :] - b[None, :, :]) ** 2, axis=-1)
    return sigma_f ** 2 * np.exp(-0.5 / l ** 2 * dist_matrix)


train_X = np.array([1, 3, 7, 9]).reshape(-1, 1)  # reshape into a 4x1 column matrix
print(gaussian_kernel(train_X, train_X))
# Output:
# [[1.00000000e+00 1.35335283e-01 1.52299797e-08 1.26641655e-14]
#  [1.35335283e-01 1.00000000e+00 3.35462628e-04 1.52299797e-08]
#  [1.52299797e-08 3.35462628e-04 1.00000000e+00 1.35335283e-01]
#  [1.26641655e-14 1.52299797e-08 1.35335283e-01 1.00000000e+00]]

输入为4个时间点 $t=1,3,7,9$，输出是这4个时间点两两之间的 $4\times 4$ 协方差矩阵。均值函数与核函数共同定义了一个高斯过程，但是由于没有任何观测值，所以这是一个先验对象。获得一组观测值后，我们需要修正高斯过程的均值函数与核函数，得到后验对象。

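首先回顾高维高斯分布的条件概率。补充一点，高斯分布具有一个特点：高斯分布的联合分布、边缘分布、条件分布仍然是高斯分布。具体地，在零均值先验下，若观测点 $X$ 的观测值为 $Y$，待预测点为 $X^*$，则后验均值与协方差为 $\mu^* = K(X^*,X)\,K(X,X)^{-1}\,Y$，$\Sigma^* = K(X^*,X^*) - K(X^*,X)\,K(X,X)^{-1}\,K(X,X^*)$。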

def gaussian_kernel(x1, x2, l=0.5, sigma_f=0.2):
    """Return the RBF (squared-exponential) kernel matrix between x1 and x2.

    k(a, b) = sigma_f**2 * exp(-||a - b||**2 / (2 * l**2))

    Args:
        x1: array-like whose first axis indexes the m input points; it may be
            1-D (scalar points) or 2-D (one row per point).
        x2: array-like whose first axis indexes the n input points.
        l: length scale of the kernel.
        sigma_f: signal standard deviation (the output scale is sigma_f**2).

    Returns:
        An (m, n) float array with entry [i, j] = k(x1[i], x2[j]).
    """
    a = np.asarray(x1, dtype=float)
    b = np.asarray(x2, dtype=float)
    # Flatten everything after the first axis so scalar points (1-D input)
    # and vector points (2-D input) go through the same code path.
    a = a.reshape(a.shape[0], int(np.prod(a.shape[1:])))
    b = b.reshape(b.shape[0], int(np.prod(b.shape[1:])))
    # Pairwise squared Euclidean distances via broadcasting: (m, 1, d) - (1, n, d).
    dist_matrix = np.sum((a[:, None, :] - b[None, :, :]) ** 2, axis=-1)
    return sigma_f ** 2 * np.exp(-0.5 / l ** 2 * dist_matrix)


def getY(X):
    """Generate noisy observations for the inputs X.

    The sine function has no special meaning here; it is only a convenient
    way to produce Y values. Gaussian noise with standard deviation 0.05 is
    added to 0.4 * sin(X).

    Returns:
        The observations as a (nested) Python list with the same shape as X.
    """
    X = np.asarray(X)
    Y = np.sin(X) * 0.4 + np.random.normal(0, 0.05, size=X.shape)
    return Y.tolist()


def update(X, X_star):
    """Compute the posterior mean and covariance of the GP at X_star.

    NOTE: the observed values are read from the module-level variable ``Y``,
    which must be defined before this function is called.

    Args:
        X: observed input points.
        X_star: input points at which the posterior is evaluated.

    Returns:
        (mu_star, cov_star): posterior mean and posterior covariance matrix.
    """
    X = np.asarray(X)
    X_star = np.asarray(X_star)
    K_YY = gaussian_kernel(X, X)            # K(X, X)
    K_ff = gaussian_kernel(X_star, X_star)  # K(X*, X*)
    K_Yf = gaussian_kernel(X, X_star)       # K(X, X*)
    # K(X*, X): the joint covariance is symmetric, so the off-diagonal
    # blocks are transposes of each other.
    K_fY = K_Yf.T
    # A small jitter on the diagonal keeps the inversion numerically stable.
    K_YY_inv = np.linalg.inv(K_YY + 1e-8 * np.eye(len(X)))  # (N, N)
    mu_star = K_fY.dot(K_YY_inv).dot(Y)
    cov_star = K_ff - K_fY.dot(K_YY_inv).dot(K_Yf)
    return mu_star, cov_star


f, ax = plt.subplots(2, 1, sharex=True, sharey=True)

# Plot the GP prior.
X_pre = np.arange(0, 10, 0.1)
mu_pre = np.array([0] * len(X_pre))
Y_pre = mu_pre
cov_pre = gaussian_kernel(X_pre, X_pre)
# 95% band: mean +/- 1.96 standard deviations of the marginal Gaussian
# at each time point.
uncertainty = 1.96 * np.sqrt(np.diag(cov_pre))
ax[0].fill_between(X_pre, Y_pre + uncertainty, Y_pre - uncertainty, alpha=0.1)
ax[0].plot(X_pre, Y_pre, label="expection")
ax[0].legend()

# Plot the GP posterior conditioned on the observations.
X = np.array([1, 3, 7, 9]).reshape(-1, 1)  # 4x1 matrix
Y = getY(X)
X_star = np.arange(0, 10, 0.1).reshape(-1, 1)
mu_star, cov_star = update(X, X_star)
print(mu_star.shape)   # (100, 1)
print(cov_star.shape)  # (100, 100): covariances between the 100 time points
# Flatten the mean to one dimension.
Y_star = mu_star.ravel()  # (100,)
# Posterior mean vs. observed value at time 9; one sample run printed
# 0.10295047719514798 and 0.10295050291616215 (values vary with the noise).
print(Y_star[90], Y[3])
# Clip tiny negative variances caused by round-off so sqrt never yields NaN.
uncertainty = 1.96 * np.sqrt(np.clip(np.diag(cov_star), 0.0, None))
ax[1].fill_between(X_star.ravel(), Y_star + uncertainty, Y_star - uncertainty, alpha=0.1)
ax[1].plot(X_star, Y_star, label="expection")
ax[1].scatter(X, Y, label="observation point", c="red", marker="x")
ax[1].legend()
plt.show()

补充内容：关于置信区间