大資料入門——手寫體資料識別(支援向量機)
阿新 • • 發佈:2018-12-30
#手寫體資料讀取 from sklearn.datasets import load_digits digits=load_digits() print(digits.data.shape) #手寫體資料分割 from sklearn.cross_validation import train_test_split X_train, X_test, y_train, y_test=train_test_split(digits.data, digits.target, test_size=0.25, random_state=33) print(y_train.shape) print(y_test.shape) #使用支援向量機進行識別 from sklearn.preprocessing import StandardScaler from sklearn.svm import LinearSVC ss=StandardScaler() X_train=ss.fit_transform(X_train) X_test=ss.transform(X_test) lsvc=LinearSVC() lsvc.fit(X_train, y_train) y_predict=lsvc.predict(X_test) #支援向量機模型的評估 print('The Accuracy of Linear SVC is', lsvc.score(X_test, y_test)) from sklearn.metrics import classification_report print(classification_report(y_test, y_predict, target_names=digits.target_names.astype(str)))