rating/rating.go at master · mashiike/rating · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
// Package rating implements the simple glicko-2 Rating.
// Glicko-2 Rating: see as following. (within this package, denoted as ref[1] below)
//
//   Professor Mark E. Glickman. "Example of the Glicko-2 system" http://www.glicko.net/glicko/glicko2.pdf
//
// Note : The variable names in this package match the mathematical Greek letter variables of the dissertation.
// Note2: This English is written by the power of Google Translate.
package rating

import (
	"encoding/binary"
	"math"
	"sync"

	"github.com/pkg/errors"
)

//Public Constant for rating value
const (
	InitialStrength  = 1500.0
	InitialDeviation = 350.0
)

const (
	//rating <=> glicko2 scale deviation convart rate
	convartRate = 173.7178
	//rating center value
	centerValue = 1500.0
	//start deviation
	startPhi = InitialDeviation / convartRate
	//x ~ N(0,1), this value is z when P(-z <= x <= z) = 0.95
	zscore95 = 1.96

	//iterative algorithm truncates with this number
	iterationLimit = 100000
	//end condition of iterative algorithm
	epsiron = 0.000001

	//ScoreWin is Score when winning an opponent.
	ScoreWin = float64(1.0)
	//ScoreLose is Score when losing to an opponent.
	ScoreLose = float64(0.0)
	//ScoreDraw is Score when tied to an opponent.
	ScoreDraw = float64(0.5)
)

//Rating is a structure to evaluate the strength of a player / team.
type Rating struct {

	// mu is a number representing strength.
	// phi is a numerical value that represents the deviation of strength. as rating deviation:RD.
	// In the glicko-2 system, x ~ N (mu, phi ^ 2) and x are evaluated with a model that considers the strength to be actually exhibited in a match
	// Note: N (0,1) is a standard normal distribution
	mu  float64
	phi float64

	// sigma is a numerical value that represents the volatility of strength.
	// If there is no war during one rating period, RD will rise by the next equation in the next period.
	//
	//   phi_next = sqrt(phi^2 + sigma^2)
	//
	// start phi is 2.014, default phi is 0.2878
	// If you want to return to start phi if you have not played for 100 rating periods.
	//
	//  sigma = sqrt((2.014^2 - 0.2878^2)/100) = 0.1997 ~= 0.2
	//
	// in ref[1], this value is 0.06
	sigma float64
}

//NewVolatility is a helper for determining Volatility.
//Calculate the appropriate value by entering the number of rating periods required to get back to the start deviation and the initial deviation
func NewVolatility(start, count float64) float64 {
	if count <= 0 {
		//Note: If count is 0 or less
		// if there is a non-match rating period,
		// it is considered to be set with the intention of returning to the initial deviation immediately.
		// So, the deviation is 0 and the required period is 1.0
		return NewVolatility(0.0, 1.0)
	}

	return nthFloor(
		math.Sqrt(
			(math.Pow(startPhi, 2)-math.Pow(start/convartRate, 2))/count,
		),
		6,
	)
}

//New is a constractor for Rating
func New(strength, deviation, volatility float64) Rating {
	return Rating{
		mu:    (strength - centerValue) / convartRate,
		phi:   deviation / convartRate,
		sigma: volatility,
	}
}

//Average returns the average strength of multiple Ratings
func Average(ratings []Rating) Rating {
	totalMu := 0.0
	totalSqPhi := 0.0
	totalSigma := 0.0
	length := float64(len(ratings))
	sqLen := math.Pow(length, 2)
	for _, r := range ratings {
		totalMu += r.mu
		totalSqPhi += math.Pow(r.phi, 2)
		totalSigma += r.sigma
	}
	return Rating{
		mu:    totalMu / length,
		phi:   math.Sqrt(totalSqPhi / sqLen),
		sigma: totalSigma / length,
	}
}

// Default is return default rating for starting Player/Team.
func Default(volatility float64) Rating {
	return New(InitialStrength, InitialDeviation, volatility)
}

// Strength is return value of strength, as rating general value.
func (r Rating) Strength() float64 {
	return nthFloor(r.mu*convartRate+centerValue, 2)
}

// Deviation is return RD(Rating Deviation) as general value.
func (r Rating) Deviation() float64 {
	return nthFloor(r.phi*convartRate, 2)
}

// Volatility is return Rating volatility.
func (r Rating) Volatility() float64 {
	return nthFloor(r.sigma, 6)
}

//Interval is return value of strength 95% confidence interval.
func (r Rating) Interval() (float64, float64) {
	s := r.Strength()
	rd2 := r.Deviation() * 2
	return s - rd2, s + rd2
}

//IsDifferent is a function to check the significance of Rating
func (r Rating) IsDifferent(o Rating) bool {
	y := r.mu - o.mu
	z := y / math.Hypot(r.phi, o.phi)
	if math.Abs(z) > zscore95 {
		return true
	}
	return false
}

//IsStronger is checker function. this rating r is storonger than rating o.
func (r Rating) IsStronger(o Rating) bool {
	if r.mu <= o.mu {
		return false
	}
	return r.IsDifferent(o)
}

//IsWeeker is checker function. this rating r is weeker than rating o.
func (r Rating) IsWeeker(o Rating) bool {
	if r.mu >= o.mu {
		return false
	}
	return r.IsDifferent(o)
}

// WinProb is estimate winning probability,
// this value 1500 and 1700, both RD is 0 => P(1700 is win) = 0.76
func (r Rating) WinProb(o Rating) float64 {
	return nthFloor(fE(r.mu, o.mu, math.Hypot(r.phi, o.phi)), 4)
}

func float64ToByte(float float64) []byte {
	bits := math.Float64bits(float)
	bytes := make([]byte, 8)
	binary.LittleEndian.PutUint64(bytes, bits)

	return bytes
}

func byteToFloat64(bytes []byte) float64 {
	bits := binary.LittleEndian.Uint64(bytes)

	return math.Float64frombits(bits)
}

const ratingBinaryVersion byte = 1

// MarshalBinary implements the encoding.BinaryMarshaler interface.
func (r Rating) MarshalBinary() ([]byte, error) {
	b := make([]byte, 0, 25)
	b = append(b, ratingBinaryVersion)
	b = append(b, float64ToByte(r.mu)...)
	b = append(b, float64ToByte(r.phi)...)
	b = append(b, float64ToByte(r.sigma)...)
	return b, nil
}

// UnmarshalBinary implements the encoding.BinaryUnmarshaler interface.
func (r *Rating) UnmarshalBinary(data []byte) error {
	buf := data
	if len(buf) == 0 {
		return errors.New("Rating.UnmarshalBinary: no data")
	}

	if buf[0] != ratingBinaryVersion {
		return errors.New("Rating.UnmarshalBinary: unsupported version")
	}

	if len(buf) != 25 {
		return errors.New("Rating.UnmarshalBinary: invalid length")
	}

	r.mu = byteToFloat64(buf[1:9])
	r.phi = byteToFloat64(buf[9:17])
	r.sigma = byteToFloat64(buf[17:25])
	return nil
}

// MarshalJSON implements the json.Marshaler interface.
// The rating is a quoted string in Default format
func (r Rating) MarshalJSON() ([]byte, error) {
	b := make([]byte, 0, len(DefaultFormat)+2)
	b = append(b, '"')
	b = r.AppendFormat(b, DefaultFormat)
	b = append(b, '"')
	return b, nil
}

// UnmarshalJSON implements the json.Unmarshaler interface.
// The rating is expected to be a quoted string in Default format.
func (r *Rating) UnmarshalJSON(data []byte) error {
	if string(data) == "null" {
		return nil
	}
	var err error
	*r, err = Parse(`"`+DefaultFormat+`"`, string(data))
	return err
}

// MarshalText implements the encoding.TextMarshaler interface.
// The rating is formatted in Default Format.
func (r Rating) MarshalText() ([]byte, error) {
	b := make([]byte, 0, len(DefaultFormat))
	return r.AppendFormat(b, DefaultFormat), nil
}

// UnmarshalText implements the encoding.TextUnmarshaler interface.
// The rating is expected to be in Default Format.
func (r *Rating) UnmarshalText(data []byte) error {
	var err error
	*r, err = Parse(DefaultFormat, string(data))
	return err
}

//Update is utils function for rating update. case non sequentially update, use this function.
func (r Rating) Update(opponents []Rating, scores []float64, tau float64) (Rating, error) {
	if len(opponents) != len(scores) {
		return r, errors.New("opponents and scores length missmatch")
	}
	e := NewEstimated(r)
	for i := 0; i < len(opponents); i++ {
		if err := e.ApplyMatch(opponents[i], scores[i]); err != nil {
			return r, err
		}
	}
	if err := e.Fix(tau); err != nil {
		return r, err
	}
	return e.Fixed, nil
}

// Estimated is a collection of Quantity related estimates that are being corrected.
// If you update the rating sequentially, use this struct to save the learning process during the current rating period.
type Estimated struct {
	sync.Mutex
	// in ref[1], this value is v^-1
	Accuracy float64 `json:"accuracy" db:"accuracy"`
	// in ref[1], this value is delta
	Improvement float64 `json:"improvement" db:"improvement"`
	// base fixed rating
	Fixed Rating `json:"fixed" db:"fixed"`
}

//NewEstimated is initial estimated value constractor
func NewEstimated(rating Rating) *Estimated {
	return &Estimated{
		Accuracy:    0.0,
		Improvement: 0.0,
		Fixed:       rating,
	}
}

// ApplyMatch reflects match results in the training estimates.
func (e *Estimated) ApplyMatch(opponent Rating, score float64) error {
	e.Lock()
	defer e.Unlock()
	if score < 0.0 || score > 1.0 {
		return errors.New("score must be 0 to 1 (win = 1, lose = 0, draw = 0.5)")
	}
	tmp := e.Improvement * e.Accuracy
	valg := fg(opponent.phi)
	valE := fE(e.Fixed.mu, opponent.mu, opponent.phi)
	e.Accuracy += valg * valg * valE * (1.0 - valE)
	tmp += valg * (score - valE)
	e.Improvement = tmp / e.Accuracy
	return nil
}

// Rating returns the current estimate
func (e *Estimated) Rating() Rating {
	return e.computeRating(e.Fixed.sigma)
}

func (e *Estimated) computeRating(sigmaDash float64) Rating {
	phiAsta := math.Hypot(e.Fixed.phi, sigmaDash)
	phiDash := 1.0 / math.Sqrt(1.0/(math.Pow(phiAsta, 2))+e.Accuracy)
	if phiDash > startPhi {
		phiDash = startPhi
	}
	return Rating{
		mu:    e.Fixed.mu + math.Pow(phiDash, 2)*e.Improvement*e.Accuracy,
		phi:   phiDash,
		sigma: sigmaDash,
	}
}

// Fix ends the rating period and determines the new rating.
// system parameter tau. this value for determine next volatility.
// in ref[1] p.1:
// "Reasonable choices are between 0.3 and 1.2,
// though the system should be tested to decide which value results in greatest predictive accuracy. "
func (e *Estimated) Fix(tau float64) error {
	e.Lock()
	defer e.Unlock()
	if tau <= 0 {
		return errors.New("tau must be a nonzero positive number")
	}
	if e.Accuracy == 0.0 {
		// if estimated accuracy is zero, can not apply. because maybe no matches.
		// In this case, rating value and volatility parameters remain the same, but the rating deviation increases
		e.Fixed.phi = math.Hypot(e.Fixed.phi, e.Fixed.sigma)
		if e.Fixed.phi > startPhi {
			e.Fixed.phi = startPhi
		}
		return nil
	}
	alg := &illinois{
		tau: tau,
	}
	e.Fixed = e.computeRating(alg.Do(e))
	return nil
}

type illinois struct {
	tau     float64
	a       float64
	v       float64
	sqDelta float64
	sqPhi   float64
}

func (alg *illinois) Do(e *Estimated) float64 {
	alg.a = math.Log(math.Pow(e.Fixed.sigma, 2))
	A := alg.a
	B := 0.0

	alg.sqDelta = math.Pow(e.Improvement, 2)
	alg.sqPhi = math.Pow(e.Fixed.phi, 2)
	alg.v = 1.0 / e.Accuracy

	switch {
	case alg.sqDelta > alg.sqPhi+alg.v:
		B = math.Log(alg.sqDelta - alg.sqPhi - alg.v)
	default:
		valf := 0.0
		for k := 1; k < iterationLimit+1; k++ {
			B = (alg.a - float64(k)*alg.tau)
			valf = alg.fx(B)
			if valf >= 0.0 {
				break
			}
		}
	}

	valfA := alg.fx(A)
	valfB := alg.fx(B)

	for i := 0; i < iterationLimit; i++ {
		if math.Abs(B-A) <= epsiron {
			break
		}
		C := A + ((A-B)*valfA)/(valfB-valfA)
		valfC := alg.fx(C)
		switch {
		case valfB*valfC < 0.0:
			A = B
			valfA = valfB
		default:
			valfA /= 2.0
		}
		B = C
		valfB = valfC
	}

	return math.Exp(A / 2.0)
}

func (alg *illinois) fx(x float64) float64 {
	sumVal := alg.sqDelta + alg.sqPhi + alg.v
	diffVal := alg.sqDelta - alg.sqPhi - alg.v
	firstTerm := (math.Exp(x) * (diffVal - math.Exp(x))) / (2 * sumVal * sumVal)
	secondTerm := (x - alg.a) / (math.Pow(alg.tau, 2))
	return firstTerm - secondTerm
}

// Truncate at n decimal places
func nthFloor(x float64, ref float64) float64 {
	shift := math.Pow(10, ref)
	return math.Trunc(x*shift) / shift
}

//fE is internal function E( score | mu, mu_j, phi_j)
func fE(mu, muOppo, phiOppo float64) float64 {
	return 1.0 / (1.0 + math.Exp(-1.0*fg(phiOppo)*(mu-muOppo)))
}

//fg is internal function g(phi)
func fg(phi float64) float64 {
	return 1.0 / math.Sqrt(1.0+3.0*(phi*phi)/(math.Pi*math.Pi))
}