基于随机森林回归预测的风机预警模型开发
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from sklearn.ensemble import RandomForestRegressor
from sklearn.model_selection import train_test_split
from sklearn.multioutput import MultiOutputRegressor
# Switch matplotlib to interactive mode.
plt.ion()

# ---- Prepare data ----
# Columns used as model features (X).
inputLabel = [
    "WindSpeed",
    "GenPower",
    "GenSpeed",
    "OutDoorTemp",
    "NacelleTemp",
]
# Columns the model predicts (y); later cells index them by position 0..4.
outputLabel = [
    "GenBearDETemp",
    "GenBearNDETemp",
    "GenStatorUTemp",
    "GenStatorVTemp",
    "GenStatorWTemp",
]

# Training and test sets come from two separate CSV files.
dataPath = "E:/DevRawModelProject/RawModelData/test/goodt20014001f.csv"
data_testPath = "E:/DevRawModelProject/RawModelData/test/t20014001_test.csv"
df = pd.read_csv(dataPath)
df_test = pd.read_csv(data_testPath)

# Plain NumPy arrays: one row per sample, one column per label above.
X_train = df[inputLabel].values
y_train = df[outputLabel].values
X_test = df_test[inputLabel].values
y_test = df_test[outputLabel].values
# ---- Train the model ----
# Depth limit passed to the random forest.
max_depth = 8
# NOTE: no random_state is passed, so the fit is not seeded
# (a fixed seed such as random_state=2 was tried and left disabled).
regr_rf = RandomForestRegressor(max_depth=max_depth)
regr_rf.fit(X_train, y_train)
RandomForestRegressor(bootstrap=True, criterion='mse', max_depth=8,
max_features='auto', max_leaf_nodes=None,
min_impurity_split=1e-07, min_samples_leaf=1,
min_samples_split=2, min_weight_fraction_leaf=0.0,
n_estimators=10, n_jobs=1, oob_score=False, random_state=None,
verbose=0, warm_start=False)
# ---- Evaluate the fitted model ----
y_rf = regr_rf.predict(X_train)      # predictions for the training inputs
y_test_rf = regr_rf.predict(X_test)  # predictions for the test-CSV inputs

# Score target column 2 (GenStatorUTemp) on the training data as
# 1 - Var(residual) / Var(target).
# NOTE(review): this is the explained-variance form; it equals R^2 only
# when the residuals have zero mean.
varR = np.var(y_train[:, 2] - y_rf[:, 2])
varT = np.var(y_train[:, 2])
r2 = 1 - varR / varT
print(r2)
0.820108692169
# Test set, target column 0 (GenBearDETemp): measured series in the default
# colour, model prediction overlaid in red.
plt.plot(y_test[:, 0])
plt.plot(y_test_rf[:, 0], 'r')
output_4_1.png
print(y_rf.shape)

# Predicted vs. measured on the training set, one point cloud per target:
# blue dots for column 0 (GenBearDETemp), red crosses for column 1
# (GenBearNDETemp).
plt.scatter(
    y_train[:, 0], y_rf[:, 0],
    c="cornflowerblue", alpha=0.5, label="predict",
)
plt.scatter(
    y_train[:, 1], y_rf[:, 1],
    marker="+", c="red", alpha=0.3, label="predict",
)
(27627, 5)
<matplotlib.collections.PathCollection at 0xeffacf8>
data:image/s3,"s3://crabby-images/dc76d/dc76d682e00474b31b395036f9918996e1ef874b" alt=""
from mpl_toolkits.mplot3d import Axes3D

# One 3D axes shared by both point clouds.
fig = plt.figure()
ax = fig.add_subplot(111, projection='3d')

# Horizontal plane: feature columns 0 and 1 (WindSpeed, GenPower).
X = X_train[:, 0]
Y = X_train[:, 1]

# Measured target column 2 (GenStatorUTemp) in the default style.
Z = y_train[:, 2]
ax.scatter(X, Y, Z)

# Model prediction for the same samples, drawn as red crosses.
Z = y_rf[:, 2]
ax.scatter(X, Y, Z, c="red", marker="+", alpha=0.5, label="Data")

plt.show()
data:image/s3,"s3://crabby-images/6982f/6982f40a68a41611ceb404fa3b4fcad5e11f387c" alt=""
# Target column 0 against target column 1 on the training set:
# measured values as blue crosses, predicted values as red crosses.
plt.scatter(
    y_train[:, 0], y_train[:, 1],
    c="cornflowerblue", marker="+", alpha=0.5, label="predict",
)
plt.scatter(
    y_rf[:, 0], y_rf[:, 1],
    marker="+", c="red", alpha=0.3, label="predict",
)
<matplotlib.collections.PathCollection at 0xd7a1a58>
data:image/s3,"s3://crabby-images/e5294/e52945c8e5ee4ff7c46675a64d495d5589540d5f" alt=""
# Display the column names of the training DataFrame.
df.columns
Index(['Unnamed: 0', 'TablePart', 'TurbineID', 'real_time', 'WindSpeed',
'GenPower', 'GenSpeed', 'OutDoorTemp', 'NacelleTemp', 'GenBearDETemp',
'GenBearNDETemp', 'GenStatorUTemp', 'GenStatorVTemp', 'GenStatorWTemp',
'con1'],
dtype='object')
# Training set, target column 0 (GenBearDETemp): measured series first,
# then the model's prediction on the same axes.
plt.plot(y_train[:, 0])
plt.plot(y_rf[:, 0])
[<matplotlib.lines.Line2D at 0xb97ee80>]
data:image/s3,"s3://crabby-images/73a99/73a99e5d61796a1405fa462bdace430f6515552a" alt=""
# Training set, target column 1 (GenBearNDETemp): measured series first,
# then the model's prediction on the same axes.
plt.plot(y_train[:, 1])
plt.plot(y_rf[:, 1])
[<matplotlib.lines.Line2D at 0xf07def0>]
data:image/s3,"s3://crabby-images/89424/894247b7ed79bb8dd05c2a847ed4d2e27cb6b615" alt=""
# Training residual (measured minus predicted) for target column 1
# (GenBearNDETemp), in sample order.
plt.plot(y_train[:, 1] - y_rf[:, 1])
[<matplotlib.lines.Line2D at 0xf128dd8>]
data:image/s3,"s3://crabby-images/9094a/9094aae51ee966dcea66adcb3665063b24a9623a" alt=""
# Training residual (measured minus predicted) for target column 0
# (GenBearDETemp), in sample order.
plt.plot(y_train[:, 0] - y_rf[:, 0])
[<matplotlib.lines.Line2D at 0xf18dd30>]
data:image/s3,"s3://crabby-images/99773/997739231b4afe4e1b3a7f797063154ca5f70b36" alt=""
# Training residual (measured minus predicted) for target column 2
# (GenStatorUTemp), in sample order.
plt.plot(y_train[:, 2] - y_rf[:, 2])
[<matplotlib.lines.Line2D at 0xf1db080>]
data:image/s3,"s3://crabby-images/513d5/513d57a0a7ad6a0897e424792669bb427af875d9" alt=""
# Training residual of target column 2 (GenStatorUTemp) plotted against
# feature column 2 (GenSpeed), one star marker per sample.
plt.plot(X_train[:, 2], y_train[:, 2] - y_rf[:, 2], '*')
plt.show()
data:image/s3,"s3://crabby-images/ed44c/ed44c812d7ac88a7e915ad803196a2b41f6b51ef" alt=""
import numpy as np

# Training-set score for target column 2 (GenStatorUTemp), computed as
# 1 - Var(residual) / Var(target).
# NOTE(review): this is the explained-variance form; it equals R^2 only
# when the residuals have zero mean.
varR = np.var(y_train[:, 2] - y_rf[:, 2])
varT = np.var(y_train[:, 2])
r2 = 1 - varR / varT
print(r2)
0.962437941174
# Recompute the predictions for the test inputs.
y_test_rf = regr_rf.predict(X_test)

# Test residual of target column 2 (GenStatorUTemp) plotted against
# feature column 2 (GenSpeed), one star marker per sample.
plt.plot(X_test[:, 2], y_test[:, 2] - y_test_rf[:, 2], '*')
plt.show()
data:image/s3,"s3://crabby-images/564ec/564ec05298e7868ecf2bf4cbe5ed697cb8ce7689" alt=""
# Test set, target column 0 (GenBearDETemp): predicted value against the
# measured value, one star marker per sample.
plt.plot(y_test[:, 0], y_test_rf[:, 0], '*')
plt.show()
data:image/s3,"s3://crabby-images/d88e7/d88e770ae2e7a15a53766757795578e8413bd558" alt=""
import numpy as np

# Test-set score for target column 2 (GenStatorUTemp), computed as
# 1 - Var(residual) / Var(target).
# NOTE(review): this is the explained-variance form; a constant offset
# between prediction and measurement does not lower it, so it equals R^2
# only when the residuals have zero mean.
varR = np.var(y_test[:, 2] - y_test_rf[:, 2])
varT = np.var(y_test[:, 2])
r2 = 1 - varR / varT
print(r2)
0.703730968599
# Smallest wind speed present in the training data.
df["WindSpeed"].min()
1.02
# GenPower against WindSpeed: training samples as '+' markers, test
# samples as 'o' markers on the same axes.
plt.plot(df['WindSpeed'], df['GenPower'], "+")
plt.plot(df_test['WindSpeed'], df_test['GenPower'], "o")
[<matplotlib.lines.Line2D at 0xf4e4470>]
data:image/s3,"s3://crabby-images/e3551/e35514d749dd40c8f72913e81a04ee610cb34945" alt=""
# Test residuals (measured minus predicted) in sample order for target
# columns 0 and 1 (GenBearDETemp, GenBearNDETemp).
plt.plot(y_test[:, 0] - y_test_rf[:, 0])
plt.plot(y_test[:, 1] - y_test_rf[:, 1])
[<matplotlib.lines.Line2D at 0xfd5e208>]
data:image/s3,"s3://crabby-images/eea66/eea660c588338deecae0d394131ea46ee628ef50" alt=""
# Test set, target column 0 (GenBearDETemp): measured series in the default
# colour, model prediction overlaid in red.
plt.plot(y_test[:, 0])
plt.plot(y_test_rf[:, 0], 'r')
[<matplotlib.lines.Line2D at 0xfd2a6d8>]
data:image/s3,"s3://crabby-images/a5a37/a5a3797722af102bb7596521a6c8060180614efd" alt=""
# Training residual of target column 2 (GenStatorUTemp) against the
# residual of target column 3 (GenStatorVTemp), one star marker per sample.
plt.plot(y_train[:, 2] - y_rf[:, 2], y_train[:, 3] - y_rf[:, 3], '*')
plt.show()
data:image/s3,"s3://crabby-images/c4ce6/c4ce62db2abbbb594f413963f0a82981f146a9bc" alt=""