def colicTest():
    """Fit weights on the horse-colic training file and measure the test error rate.

    Reads tab-separated rows from ``horseColicTraining.txt`` and
    ``horseColicTest.txt`` (paths relative to the current working directory).
    In every row the first 21 columns are taken as features and the column at
    index 21 as the class label.  Weights are fitted by ``stocGradAscent1``
    with 1000 iterations, and each test row is classified with
    ``classifyVector``.  Blank lines in either file are ignored.

    Returns:
        float: number of misclassified test rows divided by the number of
        test rows.

    Raises:
        OSError: if either data file cannot be opened.
        ValueError: if a field cannot be parsed as a number.
        IndexError: if a non-blank row has fewer than 22 columns.
        ZeroDivisionError: if the test file contains no data rows.
    """
    numFeatures = 21  # columns 0..20 are features; column 21 holds the label

    # Open both files up front so a missing file fails before the training
    # step, and let the context manager close them in every case.
    with open('horseColicTraining.txt') as frTrain, \
            open('horseColicTest.txt') as frTest:
        trainLines = frTrain.readlines()
        testLines = frTest.readlines()

    trainingSet = []
    trainingLabels = []
    for line in trainLines:
        stripped = line.strip()
        if not stripped:
            continue  # tolerate blank lines such as a trailing newline
        currLine = stripped.split('\t')
        trainingSet.append([float(value) for value in currLine[:numFeatures]])
        trainingLabels.append(float(currLine[numFeatures]))

    # Compute the regression coefficient vector, iterating 1000 times.
    trainWeights = stocGradAscent1(array(trainingSet), trainingLabels, 1000)

    # Run the test set through the classifier and count the mistakes.
    errorCount = 0
    numTestVec = 0.0
    for line in testLines:
        stripped = line.strip()
        if not stripped:
            continue
        numTestVec += 1.0
        currLine = stripped.split('\t')
        lineArr = [float(value) for value in currLine[:numFeatures]]
        # int(float(...)) accepts both "1" and "1.000000" label spellings,
        # matching how the training labels are parsed.
        expected = int(float(currLine[numFeatures]))
        if int(classifyVector(array(lineArr), trainWeights)) != expected:
            errorCount += 1

    errorRate = float(errorCount) / numTestVec
    print("the error rate of this test is: %f" % errorRate)
    return errorRate
def multiTest(numTests=10):
    """Call ``colicTest`` several times and print the mean error rate.

    Args:
        numTests: how many times to call ``colicTest``.  Defaults to 10, the
            value that used to be hard-coded, so existing ``multiTest()``
            calls behave as before.

    Raises:
        ValueError: if ``numTests`` is smaller than 1 (the average would be
            undefined).
    """
    if numTests < 1:
        raise ValueError("numTests must be at least 1")

    # Average over several runs; presumably individual runs differ because
    # the training step is randomized -- confirm against stocGradAscent1.
    errorSum = 0.0
    for _ in range(numTests):
        errorSum += colicTest()
    print("after %d iterations the average error rate is: %f" % (numTests, errorSum/float(numTests)))
Post title:Logistic Regression
Post author:langu_xyz
Create time:2019-07-27 21:00:00
Post link:https://blog.langu.xyz/Logistic Regression/
Copyright Notice: All articles in this blog are licensed under BY-NC-SA unless otherwise stated.