/
relay.go
229 lines (188 loc) · 6.4 KB
/
relay.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
// Copyright 2016 Netflix, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package batched
import (
"math/rand"
"sync"
"sync/atomic"
"time"
"github.com/netflix/rend/metrics"
)
// Metrics published by the batch relay subsystem: counters for lifecycle and
// expansion events, plus gauges for current pool size and the most recently
// computed load factor.
var (
	MetricBatchRelaysCreated         = metrics.AddCounter("batch_relay_created", nil)
	MetricBatchMonitorRuns           = metrics.AddCounter("batch_monitor_runs", nil)
	MetricBatchConnectionsCreated    = metrics.AddCounter("batch_connections_created", nil)
	MetricBatchConnectionFailure     = metrics.AddCounter("batch_connection_failure", nil)
	MetricBatchExpandLoadFactor      = metrics.AddCounter("batch_expand_load_factor", nil)
	MetricBatchExpandOverloadedRatio = metrics.AddCounter("batch_expand_overloaded_ratio", nil)
	MetricBatchPoolSize              = metrics.AddIntGauge("batch_pool_size", nil)
	MetricBatchLastLoadFactor        = metrics.AddFloatGauge("batch_last_load_factor", nil)
)
// Process-wide registry of relays, keyed by socket path. relayLock guards all
// reads and writes of the relays map (see getRelay for the locking protocol).
var (
	relays    = make(map[string]*relay)
	relayLock = new(sync.RWMutex)
)
// relay fans requests for a single backend socket out across a growable pool
// of batching connections.
type relay struct {
	// sock is the socket path this relay's connections dial.
	sock string
	// conns holds the current []*conn pool. The slice is replaced wholesale
	// (copy-on-write) under addConnLock, so readers can Load without locking.
	conns atomic.Value
	// addConnLock serializes pool growth in addConn.
	addConnLock *sync.Mutex
	// expand is the overload-notification channel handed to each conn. It is
	// currently left nil: its creation in getRelay and its consumer select in
	// monitor are both commented out (expansion-by-notification is disabled).
	expand chan struct{}
	// opts carries the batching/tuning parameters used when creating connections.
	opts Opts
}
// getRelay returns the relay serving the given socket path, creating it (and
// waiting for its first connection to come up) if none exists yet. Creation
// uses double-checked locking so concurrent callers for the same socket end
// up sharing a single relay.
func getRelay(sock string, opts Opts) *relay {
	// Fast path: most calls find an existing relay under the read lock.
	relayLock.RLock()
	existing, found := relays[sock]
	relayLock.RUnlock()
	if found {
		return existing
	}

	// Slow path: take the write lock to create a relay for this socket path.
	// Competing callers block here and pick the new relay up on the re-check.
	relayLock.Lock()
	defer relayLock.Unlock()

	// Re-check under the write lock; another goroutine may have won the race.
	if existing, found := relays[sock]; found {
		return existing
	}

	metrics.IncCounter(MetricBatchRelaysCreated)

	r := &relay{
		sock:        sock,
		conns:       atomic.Value{},
		addConnLock: new(sync.Mutex),
		// expand deliberately left nil while the overload-notification path
		// is disabled: make(chan struct{}, 1)
		opts: opts,
	}

	// Seed the atomic value with an empty pool so Load always type-asserts.
	r.conns.Store(make([]*conn, 0))

	// Block until the monitor has established the first connection so the
	// relay is immediately usable when we publish and return it.
	ready := make(chan struct{})
	go r.monitor(ready)
	<-ready

	relays[sock] = r
	return r
}
// addConn appends one new connection to the relay's pool. Growth is one-way:
// this is a high-water-mark pool and connections are never torn down.
func (r *relay) addConn() {
	// Serialize growers so two concurrent adds can't both copy the same
	// slice and lose a connection.
	r.addConnLock.Lock()
	defer r.addConnLock.Unlock()

	pool := r.conns.Load().([]*conn)
	nextID := uint32(len(pool))
	delay := time.Duration(r.opts.BatchDelayMicros) * time.Microsecond

	fresh := newConn(r.sock, nextID, delay, r.opts.BatchSize, r.opts.ReadBufSize, r.opts.WriteBufSize, r.expand)

	// Publish a new slice header; readers holding the old value are unaffected.
	r.conns.Store(append(pool, fresh))
}
// submit hands req to a uniformly random connection in the pool. The caller
// supplies its own *rand.Rand so no generator state is shared between
// external connections; the chosen connection replies to the frontend via
// the channel carried inside the request itself.
func (r *relay) submit(rng *rand.Rand, req request) {
	pool := r.conns.Load().([]*conn)
	pool[rng.Intn(len(pool))].reqchan <- req
}
// monitor drives pool sizing for the relay. It creates the first connection,
// signals firstConnSetup once that connection exists, then loops forever:
// every EvaluationIntervalSec seconds it samples each connection's average
// batch size and adds one connection when either expansion heuristic fires.
// There is no shrink path (see addConn). Never returns.
func (r *relay) monitor(firstConnSetup chan struct{}) {
	// do monitoring stuff
	// keep track of queue depths
	// this will need some handles to all the connections
	// atomic swap 0 in to each high water mark gauge
	// take max of all of them
	// since batch size is universal, we can compare against that
	// if the historical trend (5 times checked?) is above, say, 80% of capacity
	// add another connection
	// maybe double if maxxed out and add a single if above a lower limit

	// create first connection and notify after it's complete
	r.addConn()
	firstConnSetup <- struct{}{}

	for {
		var shouldAdd bool

		// re-evaluate at regular interval regardless
		// NOTE(review): time.After allocates a fresh timer each iteration; a
		// time.Ticker would avoid that, but this fires once per interval so
		// the cost is negligible.
		<-time.After(time.Duration(r.opts.EvaluationIntervalSec) * time.Second)
		metrics.IncCounter(MetricBatchMonitorRuns)

		/* off for now
		// Re-evaluate either after 30 seconds or when a connection notifies that
		// it is overloaded.
		select {
		case <-time.After(evaluationIntervalSec * time.Second):
			println("MONITOR TIMED OUT")
		case <-r.expand:
			println("NOTIFIED TO EXPAND")
			//shouldAdd = true
		}
		*/

		//println("MONITOR RUNNING")

		cs := r.conns.Load().([]*conn)

		/*
			maxes := make([]uint32, len(cs))

			// Extract the maximum batch sizes seen since the last check
			for i, c := range cs {
				maxes[i] = atomic.SwapUint32(c.maxBatchSize, 0)
				//println("MAX BATCH SIZE", i, maxes[i])
			}
		*/

		averages := make([]float64, len(cs))

		// Extract the packed average data and calculate all the averages.
		// Each conn packs (numBatches << 32) | numCmds into a single uint64 so
		// the pair can be read-and-reset atomically in one swap.
		for i, c := range cs {
			avgData := atomic.SwapUint64(c.avgBatchData, 0)
			numBatches := avgData >> 32
			numCmds := avgData & 0xFFFFFFFF

			// Guard the division: an idle connection has zero batches and
			// contributes an average of 0.
			var avg float64
			if numBatches != 0 {
				avg = float64(numCmds) / float64(numBatches)
			}

			averages[i] = avg
		}

		// Heuristic: calculate the percentage of the total batch capacity used on average
		var used float64
		for _, u := range averages {
			used += u
		}

		total := float64(len(cs)) * float64(r.opts.BatchSize)
		loadFactor := float64(used) / total
		metrics.SetFloatGauge(MetricBatchLastLoadFactor, loadFactor)

		// Heuristic 1: if we are over our load factor ratio, expand.
		if loadFactor > r.opts.LoadFactorExpandRatio {
			metrics.IncCounter(MetricBatchExpandLoadFactor)
			shouldAdd = true
		}

		// Heuristic 2: if a configurable percentage of connections got very
		// close to their batch-size limit (or hit it), expand.
		var numOverloaded int
		for _, m := range averages {
			if m >= float64(r.opts.BatchSize-1) {
				numOverloaded++
			}
		}

		if float64(numOverloaded)/float64(len(cs)) > r.opts.OverloadedConnRatio {
			metrics.IncCounter(MetricBatchExpandOverloadedRatio)
			shouldAdd = true
		}

		// add a connection if needed, and record the new pool size
		if shouldAdd {
			r.addConn()
			metrics.SetIntGauge(MetricBatchPoolSize, uint64(len(r.conns.Load().([]*conn))))
		}
	}
}