from sklearn.linear_model import LinearRegression from sklearn.neighbors import KNeighborsClassifier from sklearn.ensemble import RandomForestClassifier
2 通用模式
2.1 分为训练集和测试集
1 2 3
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=0)
2.2 建立模型
1 2 3
from sklearn.neighbors import KNeighborsClassifier
knn = KNeighborsClassifier()
2.3 训练
1
knn.fit(X_train, y_train)
2.4 预测
1
knn.predict(X_test)
2.5 准确率
2.5.1 方法1
1
print(knn.score(X_test, y_test))
2.5.2 方法2
1 2 3
from sklearn.metrics import accuracy_score
score = accuracy_score(predict, test_labels)
3 数据预处理
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
from sklearn import preprocessing import numpy as np