Predictive maintenance (PdM) is a data-driven form of preventive maintenance. It is a proactive strategy that uses sensors to monitor equipment performance and condition during operation. PdM methods continuously analyze these data to predict the optimal time to perform maintenance. Applied correctly, PdM can lower maintenance costs and prevent catastrophic equipment failures.

In this notebook we will apply NeuralForecast to perform supervised remaining useful life (RUL) estimation on the classic PHM2008 aircraft degradation dataset.

Outline
1. Installing packages
2. Loading the PHM2008 aircraft degradation dataset
3. Fitting and predicting with NeuralForecast
4. Evaluating predictions

You can run these experiments on a GPU using Google Colab.

1. Installing packages

!pip install neuralforecast datasetsforecast
import logging
import numpy as np
import pandas as pd

import matplotlib.pyplot as plt
plt.rcParams['font.family'] = 'serif'

from neuralforecast.models import NBEATSx
from neuralforecast import NeuralForecast
from neuralforecast.losses.pytorch import HuberLoss

from datasetsforecast.phm2008 import PHM2008
logging.getLogger("pytorch_lightning").setLevel(logging.ERROR)

2. Loading the PHM2008 aircraft degradation dataset

Here we load the Prognostics and Health Management 2008 challenge dataset. It uses the Commercial Modular Aero-Propulsion System Simulation to reproduce the degradation of turbofan engines from different aircraft operating under normal conditions, with varying initial wear and manufacturing conditions. The training set contains complete run-to-failure simulations, while the test set contains sequences that stop before failure occurs.

Y_train_df, Y_test_df = PHM2008.load(directory='./data', group='FD001', clip_rul=False)
Y_train_df
| | unique_id | ds | s_2 | s_3 | s_4 | s_7 | s_8 | s_9 | s_11 | s_12 | s_13 | s_14 | s_15 | s_17 | s_20 | s_21 | y |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 1 | 1 | 641.82 | 1589.70 | 1400.60 | 554.36 | 2388.06 | 9046.19 | 47.47 | 521.66 | 2388.02 | 8138.62 | 8.4195 | 392 | 39.06 | 23.4190 | 191 |
| 1 | 1 | 2 | 642.15 | 1591.82 | 1403.14 | 553.75 | 2388.04 | 9044.07 | 47.49 | 522.28 | 2388.07 | 8131.49 | 8.4318 | 392 | 39.00 | 23.4236 | 190 |
| 2 | 1 | 3 | 642.35 | 1587.99 | 1404.20 | 554.26 | 2388.08 | 9052.94 | 47.27 | 522.42 | 2388.03 | 8133.23 | 8.4178 | 390 | 38.95 | 23.3442 | 189 |
| 3 | 1 | 4 | 642.35 | 1582.79 | 1401.87 | 554.45 | 2388.11 | 9049.48 | 47.13 | 522.86 | 2388.08 | 8133.83 | 8.3682 | 392 | 38.88 | 23.3739 | 188 |
| 4 | 1 | 5 | 642.37 | 1582.85 | 1406.22 | 554.00 | 2388.06 | 9055.15 | 47.28 | 522.19 | 2388.04 | 8133.80 | 8.4294 | 393 | 38.90 | 23.4044 | 187 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 20626 | 100 | 196 | 643.49 | 1597.98 | 1428.63 | 551.43 | 2388.19 | 9065.52 | 48.07 | 519.49 | 2388.26 | 8137.60 | 8.4956 | 397 | 38.49 | 22.9735 | 4 |
| 20627 | 100 | 197 | 643.54 | 1604.50 | 1433.58 | 550.86 | 2388.23 | 9065.11 | 48.04 | 519.68 | 2388.22 | 8136.50 | 8.5139 | 395 | 38.30 | 23.1594 | 3 |
| 20628 | 100 | 198 | 643.42 | 1602.46 | 1428.18 | 550.94 | 2388.24 | 9065.90 | 48.09 | 520.01 | 2388.24 | 8141.05 | 8.5646 | 398 | 38.44 | 22.9333 | 2 |
| 20629 | 100 | 199 | 643.23 | 1605.26 | 1426.53 | 550.68 | 2388.25 | 9073.72 | 48.39 | 519.67 | 2388.23 | 8139.29 | 8.5389 | 395 | 38.29 | 23.0640 | 1 |
| 20630 | 100 | 200 | 643.85 | 1600.38 | 1432.14 | 550.79 | 2388.26 | 9061.48 | 48.20 | 519.30 | 2388.26 | 8137.33 | 8.5036 | 396 | 38.37 | 23.0522 | 0 |
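As a quick sanity check that the training set is run-to-failure (the RUL `y` counts down to 0 at each engine's last cycle), one can group by engine and inspect trajectory length and final RUL. A minimal sketch on a toy frame with the same `unique_id`/`ds`/`y` layout as `Y_train_df`:

```python
import pandas as pd

# Toy run-to-failure frame mimicking Y_train_df's layout:
# each engine's RUL (y) counts down to 0 at its last cycle.
df = pd.DataFrame({
    'unique_id': [1, 1, 1, 2, 2],
    'ds':        [1, 2, 3, 1, 2],
    'y':         [2, 1, 0, 1, 0],
})

# Trajectory length and final RUL per engine.
summary = df.groupby('unique_id')['y'].agg(['size', 'last'])
print(summary)
# In run-to-failure data every 'last' entry is 0.
```

The same `groupby` applies unchanged to the real `Y_train_df`.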
plot_df1 = Y_train_df[Y_train_df['unique_id']==1]
plot_df2 = Y_train_df[Y_train_df['unique_id']==2]
plot_df3 = Y_train_df[Y_train_df['unique_id']==3]

# Solid lines show the raw RUL targets; dashed lines show the RUL clipped at 125.
# Engines 2 and 3 are shifted by ±1.5 so the overlapping curves stay distinguishable.
plt.plot(plot_df1.ds, np.minimum(plot_df1.y, 125), color='#2D6B8F', linestyle='--')
plt.plot(plot_df1.ds, plot_df1.y, color='#2D6B8F', label='Engine 1')

plt.plot(plot_df2.ds, np.minimum(plot_df2.y, 125)+1.5, color='#CA6F6A', linestyle='--')
plt.plot(plot_df2.ds, plot_df2.y+1.5, color='#CA6F6A', label='Engine 2')

plt.plot(plot_df3.ds, np.minimum(plot_df3.y, 125)-1.5, color='#D5BC67', linestyle='--')
plt.plot(plot_df3.ds, plot_df3.y-1.5, color='#D5BC67', label='Engine 3')

plt.ylabel('Remaining Useful Life (RUL)', fontsize=15)
plt.xlabel('Time Cycle', fontsize=15)
plt.legend()
plt.grid()

def smooth(s, b=0.98):
    # Bias-corrected exponential moving average of a sensor series.
    v = np.zeros(len(s) + 1)   # running average, v[0] = 0
    bc = np.zeros(len(s) + 1)  # bias-correction factors 1 - b**t
    for i in range(1, len(v)):
        v[i] = b * v[i-1] + (1 - b) * s[i-1]
        bc[i] = 1 - b**i
    sm = v[1:] / bc[1:]        # dividing by 1 - b**t removes the zero-start bias
    return sm
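A quick property check of the bias-corrected average (the function is repeated here so the snippet is self-contained): a constant signal should pass through unchanged, because the correction factor `1 - b**t` exactly cancels the zero initialization.

```python
import numpy as np

def smooth(s, b=0.98):
    # Bias-corrected exponential moving average, as defined above.
    v = np.zeros(len(s) + 1)   # running average, v[0] = 0
    bc = np.zeros(len(s) + 1)  # bias-correction factors 1 - b**t
    for i in range(1, len(v)):
        v[i] = b * v[i-1] + (1 - b) * s[i-1]
        bc[i] = 1 - b**i
    return v[1:] / bc[1:]

# A constant signal is a fixed point of the smoother:
# v[t] = c * (1 - b**t), so v[t] / (1 - b**t) = c exactly.
const = np.full(50, 3.0)
print(np.allclose(smooth(const), 3.0))  # True
```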

unique_id = 1
plot_df = Y_train_df[Y_train_df.unique_id == unique_id].copy()

fig, axes = plt.subplots(2,3, figsize = (8,5))
fig.tight_layout()

# Plot the first six sensors; the remaining ones ('s_11' ... 's_21') behave similarly.
for j, feature in enumerate(['s_2', 's_3', 's_4', 's_7', 's_8', 's_9']):
    axes[j // 3, j % 3].plot(plot_df.ds, plot_df[feature],
                             c='#2D6B8F', label='original')
    axes[j // 3, j % 3].plot(plot_df.ds, smooth(plot_df[feature].values),
                             c='#CA6F6A', label='smoothed')
    axes[j // 3, j % 3].set_title(feature)
    axes[j // 3, j % 3].grid()
    axes[j // 3, j % 3].legend()

plt.suptitle(f'Engine {unique_id} sensor records')
plt.tight_layout()

3. Fitting and predicting with NeuralForecast

NeuralForecast methods can solve regression problems involving a variety of variables. Such a regression problem consists of predicting a target variable $y_{t+h}$ from its lags $y_{:t}$, temporal exogenous features $x^{(h)}_{:t}$, exogenous features available at prediction time $x^{(f)}_{:t+h}$, and static features $x^{(s)}$.

Remaining useful life (RUL) estimation reduces this to a single-horizon prediction with $h=1$: the goal is to predict $y_{t+1}$ from the exogenous features $x^{(f)}_{:t+1}$ and the static features $x^{(s)}$. In the RUL estimation task, the exogenous features typically correspond to sensor monitoring information, while the target variable represents the RUL itself.

$$P(y_{t+1}\;|\;x^{(f)}_{:t+1},\,x^{(s)})$$
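The RUL target itself is typically built from run-to-failure data as the number of cycles remaining before each engine's final one, optionally clipped at a ceiling (the dashed curves earlier in this notebook use 125). A minimal sketch on a toy frame; the column names mirror the notebook, and the clipping constant is an assumption:

```python
import numpy as np
import pandas as pd

# Toy cycle counters for two engines; the last observed cycle is the failure point.
df = pd.DataFrame({
    'unique_id': [1, 1, 1, 2, 2],
    'ds':        [1, 2, 3, 1, 2],
})

# RUL = cycles remaining until each engine's last observed cycle.
df['y'] = df.groupby('unique_id')['ds'].transform('max') - df['ds']

# Clipping at a ceiling (125 in this notebook's plots) gives early, healthy
# cycles a flat target instead of an arbitrarily large one.
df['y_clipped'] = np.minimum(df['y'], 125)
print(df['y'].tolist())  # [2, 1, 0, 1, 0]
```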

Y_train_df, Y_test_df = PHM2008.load(directory='./data', group='FD001', clip_rul=True)
max_ds = Y_train_df.groupby('unique_id')["ds"].max()
Y_test_df = Y_test_df.merge(max_ds, on='unique_id', how='left', suffixes=('', '_train_max_date'))
Y_test_df["ds"] = Y_test_df["ds"] + Y_test_df["ds_train_max_date"]
Y_test_df = Y_test_df.drop(columns=["ds_train_max_date"])
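The three lines above turn each test engine's local cycle counter into a continuation of its training timeline, since NeuralForecast expects the future frame to start right after the training data ends for each `unique_id`. The same shift on toy frames:

```python
import pandas as pd

train = pd.DataFrame({'unique_id': [1, 1, 2], 'ds': [1, 2, 1]})
test  = pd.DataFrame({'unique_id': [1, 2],    'ds': [1, 1]})

# Last training cycle per engine.
max_ds = train.groupby('unique_id')['ds'].max()

# Shift test cycles so they continue where training left off.
test = test.merge(max_ds, on='unique_id', how='left',
                  suffixes=('', '_train_max_date'))
test['ds'] = test['ds'] + test['ds_train_max_date']
test = test.drop(columns=['ds_train_max_date'])
print(test['ds'].tolist())  # [3, 2]
```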
futr_exog_list =['s_2', 's_3', 's_4', 's_7', 's_8', 's_9', 's_11',
                 's_12', 's_13', 's_14', 's_15', 's_17', 's_20', 's_21']

model = NBEATSx(h=1, 
                input_size=24,
                loss=HuberLoss(),
                scaler_type='robust',
                stack_types=['identity', 'identity', 'identity'],
                dropout_prob_theta=0.5,
                futr_exog_list=futr_exog_list,
                exclude_insample_y = True,
                max_steps=1000)
nf = NeuralForecast(models=[model], freq=1)

nf.fit(df=Y_train_df)
Y_hat_df = nf.predict(futr_df=Y_test_df)

4. Evaluating predictions

In the original PHM2008 dataset, the ground-truth RUL for the test set is provided only at each engine's last time cycle. We therefore filter the predictions and evaluate only that last cycle.

$$\mathrm{RMSE}(\mathbf{y}_{T},\hat{\mathbf{y}}_{T}) = \sqrt{\frac{1}{|\mathcal{D}_{test}|} \sum_{i} (y_{i,T}-\hat{y}_{i,T})^{2}}$$
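For reference, this RMSE can be computed directly with NumPy; the values below are hypothetical last-cycle RULs, not the notebook's results:

```python
import numpy as np

# Hypothetical true and predicted RUL at each test engine's last cycle.
y_true = np.array([112.0, 98.0, 69.0])
y_pred = np.array([110.0, 100.0, 72.0])

# RMSE over the test engines, matching the formula above.
rmse = np.sqrt(np.mean((y_true - y_pred) ** 2))
print(round(rmse, 4))
```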

from utilsforecast.evaluation import evaluate
from utilsforecast.losses import rmse
metrics = evaluate(Y_hat_df.merge(Y_test_df[["unique_id", "ds", "y"]], on=['unique_id', 'ds']),
                   metrics=[rmse],
                   agg_fn='mean')

metrics
| | metric | NBEATSx |
|---|---|---|
| 0 | rmse | 118.179373 |
# Merge predictions with the ground truth (as in the evaluation above)
# so true and predicted RUL can be plotted together.
model_name = 'NBEATSx'
Y_hat_df2 = Y_hat_df.merge(Y_test_df[["unique_id", "ds", "y"]], on=['unique_id', 'ds'])

plot_df1 = Y_hat_df2[Y_hat_df2['unique_id']==1]
plot_df2 = Y_hat_df2[Y_hat_df2['unique_id']==2]
plot_df3 = Y_hat_df2[Y_hat_df2['unique_id']==3]

plt.plot(plot_df1.ds, plot_df1['y'], c='#2D6B8F', label='E1 true RUL')
plt.plot(plot_df1.ds, plot_df1[model_name]+1, c='#2D6B8F', linestyle='--', label='E1 predicted RUL')

plt.plot(plot_df2.ds, plot_df2['y'], c='#CA6F6A', label='E2 true RUL')
plt.plot(plot_df2.ds, plot_df2[model_name]+1, c='#CA6F6A', linestyle='--', label='E2 predicted RUL')

plt.plot(plot_df3.ds, plot_df3['y'], c='#D5BC67', label='E3 true RUL')
plt.plot(plot_df3.ds, plot_df3[model_name]+1, c='#D5BC67', linestyle='--', label='E3 predicted RUL')

plt.legend()
plt.grid()

References