-
Notifications
You must be signed in to change notification settings - Fork 1.4k
/
Copy paththreshold.py
55 lines (46 loc) · 1.58 KB
/
threshold.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
# This code is supporting material for the book
# Building Machine Learning Systems with Python
# by Willi Richert and Luis Pedro Coelho
# published by PACKT Publishing
#
# It is made available under the MIT License
import numpy as np
# This function was called ``learn_model`` in the first edition
def fit_model(features, labels):
'''Learn a simple threshold model'''
best_acc = -1.0
# Loop over all the features:
for fi in range(features.shape[1]):
thresh = features[:, fi].copy()
# test all feature values in order:
thresh.sort()
for t in thresh:
pred = (features[:, fi] > t)
# Measure the accuracy of this
acc = (pred == labels).mean()
rev_acc = (pred == ~labels).mean()
if rev_acc > acc:
acc = rev_acc
reverse = True
else:
reverse = False
if acc > best_acc:
best_acc = acc
best_fi = fi
best_t = t
best_reverse = reverse
# A model is a threshold and an index
return best_t, best_fi, best_reverse
# This function was called ``apply_model`` in the first edition
def predict(model, features):
'''Apply a learned model'''
# A model is a pair as returned by fit_model
t, fi, reverse = model
if reverse:
return features[:, fi] <= t
else:
return features[:, fi] > t
def accuracy(features, labels, model):
'''Compute the accuracy of the model'''
preds = predict(model, features)
return np.mean(preds == labels)