-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathvariant.go
63 lines (51 loc) · 1.15 KB
/
variant.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
package bandit
import (
"errors"
)
// Variant is an individual variant of an experiment. It exposes the running
// reward statistics gathered for the variant and a way to record a new reward.
type Variant interface {
	// ObservationCount reports how many rewards have been observed.
	ObservationCount() int
	// RewardSum reports the sum of the observed rewards.
	RewardSum() float64
	// RewardSquareSum reports the sum of the squares of the observed rewards.
	RewardSquareSum() float64

	// Observe records reward and returns the resulting Variant, or an error
	// when the reward is not accepted. The implementation in this file
	// returns an updated copy rather than modifying the receiver.
	Observe(reward float64) (Variant, error)
}
// OutOfRangeReward is the error returned when a reward lies outside the
// closed interval [0, 1]. Both endpoints are accepted by checkReward, so the
// message states an inclusive upper bound.
//
// The name predates the ErrXxx convention and is kept so existing callers
// that compare against it keep compiling.
var OutOfRangeReward = errors.New("Reward is out of range [0, 1]")
// Compile-time assertion that the value type variant (and therefore also
// *variant) satisfies Variant.
var _ = Variant(variant{})
// In memory implementation of a variant.
type variant struct {
rewardSum float64
rewardSquareSum float64
observationCount int "oc"
}
// RewardSum returns the sum of rewards stored in v.
func (v variant) RewardSum() float64 {
	return v.rewardSum
}

// RewardSquareSum returns the sum of squared rewards stored in v.
func (v variant) RewardSquareSum() float64 {
	return v.rewardSquareSum
}

// ObservationCount returns the number of observations stored in v.
func (v variant) ObservationCount() int {
	return v.observationCount
}
// NewVariant returns a Variant whose reward sums and observation count all
// start at zero. The returned value wraps a pointer to a zeroed variant.
func NewVariant() Variant {
	return new(variant)
}
// Observe validates reward with checkReward and, when it is accepted, returns
// a new variant whose sums and count include it. The receiver is a value, so
// the variant Observe was called on is never modified; callers must use the
// returned Variant.
//
// When the reward is rejected, the unchanged variant is returned together
// with the validation error.
func (v variant) Observe(reward float64) (Variant, error) {
	err := checkReward(reward)
	if err != nil {
		return v, err
	}

	// Build the updated estimates as a fresh value.
	updated := variant{
		rewardSum:        v.rewardSum + reward,
		rewardSquareSum:  v.rewardSquareSum + reward*reward,
		observationCount: v.observationCount + 1,
	}
	return updated, nil
}
// checkReward reports whether reward may be recorded. It returns nil for a
// reward in the closed interval [0, 1] and OutOfRangeReward for anything
// else, including NaN and the infinities.
func checkReward(reward float64) error {
	// Phrased as a positive range test on purpose: every comparison involving
	// NaN is false, so NaN fails this condition and is rejected. Testing
	// "reward < 0 || reward > 1" instead would let NaN through and corrupt
	// the running sums. Do not rewrite this with De Morgan's law.
	if reward >= 0 && reward <= 1 {
		return nil
	}
	return OutOfRangeReward
}