简单版本,按照李航的《统计学习方法》的思路编写
数据采用了著名的sklearn自带的iries数据,最优化求解采用了SGD算法。
预处理增加了标准化操作。
''' perceptron classifier created on 2019.9.14 author: vince ''' import pandas import numpy import logging import matplotlib.pyplot as plt from sklearn.datasets import load_iris from sklearn.model_selection import train_test_split from sklearn.metrics import accuracy_score ''' perceptron classifier Attributes w: ld-array = weights after training l: list = number of misclassification during each iteration ''' class Perceptron: def __init__(self, eta = 0.01, iter_num = 50, batch_size = 1): ''' eta: float = learning rate (between 0.0 and 1.0). iter_num: int = iteration over the training dataset. batch_size: int = gradient descent batch number, if batch_size == 1, used SGD; if batch_size == 0, use BGD; else MBGD; ''' self.eta = eta; self.iter_num = iter_num; self.batch_size = batch_size; def train(self, X, Y): ''' train training data. X:{array-like}, shape=[n_samples, n_features] = Training vectors, where n_samples is the number of training samples and n_features is the number of features. Y:{array-like}, share=[n_samples] = traget values. ''' self.w = numpy.zeros(1 + X.shape[1]); self.l = numpy.zeros(self.iter_num); for iter_index in range(self.iter_num): for sample_index in range(X.shape[0]): if (self.activation(X[sample_index]) != Y[sample_index]): logging.debug("%s: pred(%s), label(%s), %s, %s" % (sample_index, self.net_input(X[sample_index]) , Y[sample_index], X[sample_index, 0], X[sample_index, 1])); self.l[iter_index] += 1; for sample_index in range(X.shape[0]): if (self.activation(X[sample_index]) != Y[sample_index]): self.w[0] += self.eta * Y[sample_index]; self.w[1:] += self.eta * numpy.dot(X[sample_index], Y[sample_index]); break; logging.info("iter %s: %s, %s, %s, %s" % (iter_index, self.w[0], self.w[1], self.w[2], self.l[iter_index])); def activation(self, x): return numpy.where(self.net_input(x) >= 0.0 , 1 , -1); def net_input(self, x): return numpy.dot(x, self.w[1:]) + self.w[0]; def predict(self, x): return self.activation(x); def main(): logging.basicConfig(level = logging.INFO, format = '%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s', datefmt = '%a, %d %b %Y %H:%M:%S'); iris = load_iris(); features = iris.data[:99, [0, 2]]; # normalization features_std = numpy.copy(features); for i in range(features.shape[1]): features_std[:, i] = (features_std[:, i] - features[:, i].mean()) / features[:, i].std(); labels = numpy.where(iris.target[:99] == 0, -1, 1); # 2/3 data from training, 1/3 data for testing train_features, test_features, train_labels, test_labels = train_test_split( features_std, labels, test_size = 0.33, random_state = 23323); logging.info("train set shape:%s" % (str(train_features.shape))); p = Perceptron(); p.train(train_features, train_labels); test_predict = numpy.array([]); for feature in test_features: predict_label = p.predict(feature); test_predict = numpy.append(test_predict, predict_label); score = accuracy_score(test_labels, test_predict); logging.info("The accruacy score is: %s "% (str(score))); #plot x_min, x_max = train_features[:, 0].min() - 1, train_features[:, 0].max() + 1; y_min, y_max = train_features[:, 1].min() - 1, train_features[:, 1].max() + 1; plt.xlim(x_min, x_max); plt.ylim(y_min, y_max); plt.xlabel("width"); plt.ylabel("heigt"); plt.scatter(train_features[:, 0], train_features[:, 1], c = train_labels, marker = 'o', s = 10); k = - p.w[1] / p.w[2]; d = - p.w[0] / p.w[2]; plt.plot([x_min, x_max], [k * x_min + d, k * x_max + d], "go-"); plt.show(); if __name__ == "__main__": main();
以上就是本文的全部内容,希望对大家的学习有所帮助,也希望大家多多支持。
华山资源网 Design By www.eoogi.com
广告合作:本站广告合作请联系QQ:858582 申请时备注:广告合作(否则不回)
免责声明:本站资源来自互联网收集,仅供用于学习和交流,请遵循相关法律法规,本站一切资源不代表本站立场,如有侵权、后门、不妥请联系本站删除!
免责声明:本站资源来自互联网收集,仅供用于学习和交流,请遵循相关法律法规,本站一切资源不代表本站立场,如有侵权、后门、不妥请联系本站删除!
华山资源网 Design By www.eoogi.com
暂无评论...
P70系列延期,华为新旗舰将在下月发布
3月20日消息,近期博主@数码闲聊站 透露,原定三月份发布的华为新旗舰P70系列延期发布,预计4月份上市。
而博主@定焦数码 爆料,华为的P70系列在定位上已经超过了Mate60,成为了重要的旗舰系列之一。它肩负着重返影像领域顶尖的使命。那么这次P70会带来哪些令人惊艳的创新呢?
根据目前爆料的消息来看,华为P70系列将推出三个版本,其中P70和P70 Pro采用了三角形的摄像头模组设计,而P70 Art则采用了与上一代P60 Art相似的不规则形状设计。这样的外观是否好看见仁见智,但辨识度绝对拉满。
更新日志
2024年11月21日
2024年11月21日
- 罗大佑-无法盗版的青春套装版10CD【WAV】
- 张学友《意乱情迷》蜚声环球 2024 [WAV+CUE][1G]
- 柏菲《好歌30年特别版2CD》最好听的影视歌曲[低速原抓WAV+CUE][1G]
- 张学友《世纪10星·永恒篇》香港版[WAV+CUE][1G]
- 模拟之声慢刻CD《刘德海.琵琶独奏精逊【低速原抓WAV+CUE】
- Jamettone-18052023—improv(EDit)(2024)【FLAC】
- 【索尼精芽20首最棒的苏格兰歌曲集【FLAC】
- 池约翰C.J《少年白马醉春风2 动画原声带》[320K/MP3][26.67MB]
- 池约翰C.J《少年白马醉春风2 动画原声带》[FLAC/分轨][144.13MB]
- 陈致逸《幻想乐园 Fantasyland》[320K/MP3][120.54MB]
- 席卷全球最红舞曲《火辣辣DJ[英文版]》[DTS-WAV]
- 群星-席卷全球最红舞曲《火辣辣DJ中文版》【WAV】
- 模拟之声慢刻CD《声入人心[年度发烧人声严选]》[低速原抓WAV+CUE]
- 陈致逸《幻想乐园 Fantasyland》[FLAC/分轨][554.27MB]
- Rhymist / LusciousBB《年轮》[320K/MP3][76.52MB]