Commit dab8af3af48f705feb0b7b683b385ffc11ccb3ca - golang-github-beorn7-perks

Use a map for targets. Bjoern Rabenstein 9 years ago

3 changed file(s) with 43 addition(s) and 46 deletion(s). Raw diff Collapse all Expand all

-4

quantile/bench_test.go less more

6	6	func BenchmarkInsertTargeted(b *testing.B) {
7	7	b.ReportAllocs()
8	8
9		s := NewTargeted(Targets...)
	9	s := NewTargeted(Targets)
10	10	b.ResetTimer()
11	11	for i := float64(0); i < float64(b.N); i++ {
12	12	s.Insert(i)

14	14	}
15	15
16	16	func BenchmarkInsertTargetedSmallEpsilon(b *testing.B) {
17		s := NewTargeted(TargetsSmallEpsilon...)
	17	s := NewTargeted(TargetsSmallEpsilon)
18	18	b.ResetTimer()
19	19	for i := float64(0); i < float64(b.N); i++ {
20	20	s.Insert(i)

38	38	}
39	39
40	40	func BenchmarkQuery(b *testing.B) {
41		s := NewTargeted(Targets...)
	41	s := NewTargeted(Targets)
42	42	for i := float64(0); i < 1e6; i++ {
43	43	s.Insert(i)
44	44	}

50	50	}
51	51
52	52	func BenchmarkQuerySmallEpsilon(b *testing.B) {
53		s := NewTargeted(TargetsSmallEpsilon...)
	53	s := NewTargeted(TargetsSmallEpsilon)
54	54	for i := float64(0); i < 1e6; i++ {
55	55	s.Insert(i)
56	56	}

+11

-14

quantile/stream.go less more

33	33	func (a Samples) Less(i, j int) bool { return a[i].Value < a[j].Value }
34	34	func (a Samples) Swap(i, j int) { a[i], a[j] = a[j], a[i] }
35	35
36		// Target describes a quantile for a targeted stream together with its absolute
37		// error, i.e. the true quantile of a value returned by a query is guaranteed to
38		// be within (Quantile±Epsilon).
39		type Target struct {
40		Quantile float64
41		Epsilon float64
42		}
43
44	36	type invariant func(s *stream, r float64) float64
45	37
46	38	// NewLowBiased returns an initialized Stream for low-biased quantiles

79	71
80	72	// NewTargeted returns an initialized Stream concerned with a particular set of
81	73	// quantile values that are supplied a priori. Knowing these a priori reduces
82		// space and computation time.
	74	// space and computation time. The targets map maps the desired quantiles to
	75	// their absolute errors, i.e. the true quantile of a value returned by a query
	76	// is guaranteed to be within (Quantile±Epsilon).
83	77	//
84	78	// See http://www.cs.rutgers.edu/~muthu/bquant.pdf for time, space, and error properties.
85		func NewTargeted(targets ...Target) *Stream {
	79	func NewTargeted(targets map[float64]float64) *Stream {
86	80	ƒ := func(s *stream, r float64) float64 {
87	81	var m = math.MaxFloat64
88	82	var f float64
89		for _, t := range targets {
90		if t.Quantile*s.n <= r {
91		f = (2 * t.Epsilon * r) / t.Quantile
	83	for quantile, epsilon := range targets {
	84	if quantile*s.n <= r {
	85	f = (2 * epsilon * r) / quantile
92	86	} else {
93		f = (2 * t.Epsilon * (s.n - r)) / (1 - t.Quantile)
	87	f = (2 * epsilon * (s.n - r)) / (1 - quantile)
94	88	}
95	89	if f < m {
96	90	m = f

151	145
152	146	// Merge merges samples into the underlying streams samples. This is handy when
153	147	// merging multiple streams from separate threads, database shards, etc.
	148	//
	149	// ATTENTION: This method is broken and does not yield correct results. The
	150	// underlying algorithm is not capable of merging streams correctly.
154	151	func (s *Stream) Merge(samples Samples) {
155	152	sort.Sort(samples)
156	153	s.stream.merge(samples)

+28

-28

quantile/stream_test.go less more

7	7	)
8	8
9	9	var (
10		Targets = []Target{
11		{Quantile: 0.01, Epsilon: 0.001},
12		{Quantile: 0.10, Epsilon: 0.01},
13		{Quantile: 0.50, Epsilon: 0.05},
14		{Quantile: 0.90, Epsilon: 0.01},
15		{Quantile: 0.99, Epsilon: 0.001},
	10	Targets = map[float64]float64{
	11	0.01: 0.001,
	12	0.10: 0.01,
	13	0.50: 0.05,
	14	0.90: 0.01,
	15	0.99: 0.001,
16	16	}
17		TargetsSmallEpsilon = []Target{
18		{Quantile: 0.01, Epsilon: 0.0001},
19		{Quantile: 0.10, Epsilon: 0.001},
20		{Quantile: 0.50, Epsilon: 0.005},
21		{Quantile: 0.90, Epsilon: 0.001},
22		{Quantile: 0.99, Epsilon: 0.0001},
	17	TargetsSmallEpsilon = map[float64]float64{
	18	0.01: 0.0001,
	19	0.10: 0.001,
	20	0.50: 0.005,
	21	0.90: 0.001,
	22	0.99: 0.0001,
23	23	}
24	24	LowQuantiles = []float64{0.01, 0.1, 0.5}
25	25	HighQuantiles = []float64{0.99, 0.9, 0.5}

29	29
30	30	func verifyPercsWithAbsoluteEpsilon(t *testing.T, a []float64, s *Stream) {
31	31	sort.Float64s(a)
32		for _, tt := range Targets {
	32	for quantile, epsilon := range Targets {
33	33	n := float64(len(a))
34		k := int(tt.Quantile * n)
35		lower := int((tt.Quantile - tt.Epsilon) * n)
	34	k := int(quantile * n)
	35	lower := int((quantile - epsilon) * n)
36	36	if lower < 1 {
37	37	lower = 1
38	38	}
39		upper := int(math.Ceil((tt.Quantile + tt.Epsilon) * n))
	39	upper := int(math.Ceil((quantile + epsilon) * n))
40	40	if upper > len(a) {
41	41	upper = len(a)
42	42	}
43	43	w, min, max := a[k-1], a[lower-1], a[upper-1]
44		if g := s.Query(tt.Quantile); g < min || g > max {
45		t.Errorf("q=%f: want %v [%f,%f], got %v", tt.Quantile, w, min, max, g)
	44	if g := s.Query(quantile); g < min || g > max {
	45	t.Errorf("q=%f: want %v [%f,%f], got %v", quantile, w, min, max, g)
46	46	}
47	47	}
48	48	}

93	93
94	94	func TestTargetedQuery(t *testing.T) {
95	95	rand.Seed(42)
96		s := NewTargeted(Targets...)
	96	s := NewTargeted(Targets)
97	97	a := populateStream(s)
98	98	verifyPercsWithAbsoluteEpsilon(t, a, s)
99	99	}

114	114
115	115	func TestTargetedMerge(t *testing.T) {
116	116	rand.Seed(42)
117		s1 := NewTargeted(Targets...)
118		s2 := NewTargeted(Targets...)
	117	s1 := NewTargeted(Targets)
	118	s2 := NewTargeted(Targets)
119	119	a := populateStream(s1)
120	120	a = append(a, populateStream(s2)...)
121	121	s1.Merge(s2.Samples())

143	143	}
144	144
145	145	func TestUncompressed(t *testing.T) {
146		q := NewTargeted(Targets...)
	146	q := NewTargeted(Targets)
147	147	for i := 100; i > 0; i-- {
148	148	q.Insert(float64(i))
149	149	}

151	151	t.Errorf("want count 100, got %d", g)
152	152	}
153	153	// Before compression, Query should have 100% accuracy.
154		for _, tt := range Targets {
155		w := tt.Quantile * 100
156		if g := q.Query(tt.Quantile); g != w {
	154	for quantile := range Targets {
	155	w := quantile * 100
	156	if g := q.Query(quantile); g != w {
157	157	t.Errorf("want %f, got %f", w, g)
158	158	}
159	159	}
160	160	}
161	161
162	162	func TestUncompressedSamples(t *testing.T) {
163		q := NewTargeted(Target{0.99, 0.001})
	163	q := NewTargeted(map[float64]float64{0.99: 0.001})
164	164	for i := 1; i <= 100; i++ {
165	165	q.Insert(float64(i))
166	166	}

170	170	}
171	171
172	172	func TestUncompressedOne(t *testing.T) {
173		q := NewTargeted(Target{0.90, 0.01})
	173	q := NewTargeted(map[float64]float64{0.99: 0.01})
174	174	q.Insert(3.14)
175	175	if g := q.Query(0.90); g != 3.14 {
176	176	t.Error("want PI, got", g)

178	178	}
179	179
180	180	func TestDefaults(t *testing.T) {
181		if g := NewTargeted(Target{0.99, 0.001}).Query(0.99); g != 0 {
	181	if g := NewTargeted(map[float64]float64{0.99: 0.001}).Query(0.99); g != 0 {
182	182	t.Errorf("want 0, got %f", g)
183	183	}
184	184	}