563768b58a
* Move to v3 Co-authored-by: Ben Toogood <bentoogood@gmail.com>
519 lines
9.5 KiB
Go
519 lines
9.5 KiB
Go
// Package cache provides a registry cache
|
|
package cache
|
|
|
|
import (
|
|
"math"
|
|
"math/rand"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/micro/go-micro/v3/logger"
|
|
"github.com/micro/go-micro/v3/registry"
|
|
util "github.com/micro/go-micro/v3/util/registry"
|
|
)
|
|
|
|
// Cache is the registry cache interface
|
|
type Cache interface {
|
|
// embed the registry interface
|
|
registry.Registry
|
|
// stop the cache watcher
|
|
Stop()
|
|
}
|
|
|
|
type Options struct {
|
|
// TTL is the cache TTL
|
|
TTL time.Duration
|
|
}
|
|
|
|
type Option func(o *Options)
|
|
|
|
type cache struct {
|
|
registry.Registry
|
|
opts Options
|
|
|
|
// registry cache. services,ttls,watched,running are grouped by doman
|
|
sync.RWMutex
|
|
services map[string]services
|
|
ttls map[string]ttls
|
|
watched map[string]watched
|
|
running map[string]bool
|
|
|
|
// used to stop the caches
|
|
exit chan bool
|
|
|
|
// indicate whether its running status of the registry used to hold onto the cache in failure state
|
|
status error
|
|
}
|
|
|
|
type services map[string][]*registry.Service
|
|
type ttls map[string]time.Time
|
|
type watched map[string]bool
|
|
|
|
var defaultTTL = time.Minute
|
|
|
|
func backoff(attempts int) time.Duration {
|
|
if attempts == 0 {
|
|
return time.Duration(0)
|
|
}
|
|
return time.Duration(math.Pow(10, float64(attempts))) * time.Millisecond
|
|
}
|
|
|
|
func (c *cache) getStatus() error {
|
|
c.RLock()
|
|
defer c.RUnlock()
|
|
return c.status
|
|
}
|
|
|
|
func (c *cache) setStatus(err error) {
|
|
c.Lock()
|
|
c.status = err
|
|
c.Unlock()
|
|
}
|
|
|
|
// isValid checks if the service is valid
|
|
func (c *cache) isValid(services []*registry.Service, ttl time.Time) bool {
|
|
// no services exist
|
|
if len(services) == 0 {
|
|
return false
|
|
}
|
|
|
|
// ttl is invalid
|
|
if ttl.IsZero() {
|
|
return false
|
|
}
|
|
|
|
// time since ttl is longer than timeout
|
|
if time.Since(ttl) > 0 {
|
|
return false
|
|
}
|
|
|
|
// ok
|
|
return true
|
|
}
|
|
|
|
func (c *cache) quit() bool {
|
|
select {
|
|
case <-c.exit:
|
|
return true
|
|
default:
|
|
return false
|
|
}
|
|
}
|
|
|
|
func (c *cache) del(domain, service string) {
|
|
// don't blow away cache in error state
|
|
if err := c.getStatus(); err != nil {
|
|
return
|
|
}
|
|
|
|
c.Lock()
|
|
defer c.Unlock()
|
|
|
|
if _, ok := c.services[domain]; ok {
|
|
delete(c.services[domain], service)
|
|
}
|
|
|
|
if _, ok := c.ttls[domain]; ok {
|
|
delete(c.ttls[domain], service)
|
|
}
|
|
}
|
|
|
|
func (c *cache) get(domain, service string) ([]*registry.Service, error) {
|
|
var services []*registry.Service
|
|
var ttl time.Time
|
|
|
|
// lookup the values in the cache before calling the underlying registrry
|
|
c.RLock()
|
|
if srvs, ok := c.services[domain]; ok {
|
|
services = srvs[service]
|
|
}
|
|
if tt, ok := c.ttls[domain]; ok {
|
|
ttl = tt[service]
|
|
}
|
|
c.RUnlock()
|
|
|
|
// got services && within ttl so return a copy of the services
|
|
if c.isValid(services, ttl) {
|
|
return util.Copy(services), nil
|
|
}
|
|
|
|
// get does the actual request for a service and cache it
|
|
get := func(domain string, service string, cached []*registry.Service) ([]*registry.Service, error) {
|
|
// ask the registry
|
|
services, err := c.Registry.GetService(service, registry.GetDomain(domain))
|
|
if err != nil {
|
|
// set the error status
|
|
c.setStatus(err)
|
|
|
|
// check the cache
|
|
if len(cached) > 0 {
|
|
return cached, nil
|
|
}
|
|
|
|
// otherwise return error
|
|
return nil, err
|
|
}
|
|
|
|
// reset the status
|
|
if err := c.getStatus(); err != nil {
|
|
c.setStatus(nil)
|
|
}
|
|
|
|
// cache results
|
|
c.set(domain, service, util.Copy(services))
|
|
|
|
return services, nil
|
|
}
|
|
|
|
// watch service if not watched
|
|
c.RLock()
|
|
var ok bool
|
|
if _, d := c.watched[domain]; d {
|
|
if _, s := c.watched[domain][service]; s {
|
|
ok = true
|
|
}
|
|
}
|
|
c.RUnlock()
|
|
|
|
// check if its being watched
|
|
if !ok {
|
|
c.Lock()
|
|
|
|
// add domain if not registered
|
|
if _, ok := c.watched[domain]; !ok {
|
|
c.watched[domain] = make(map[string]bool)
|
|
}
|
|
|
|
// set to watched
|
|
c.watched[domain][service] = true
|
|
|
|
running := c.running[domain]
|
|
c.Unlock()
|
|
|
|
// only kick it off if not running
|
|
if !running {
|
|
go c.run(domain)
|
|
}
|
|
}
|
|
|
|
// get and return services
|
|
return get(domain, service, services)
|
|
}
|
|
|
|
func (c *cache) set(domain string, service string, srvs []*registry.Service) {
|
|
c.Lock()
|
|
defer c.Unlock()
|
|
|
|
if _, ok := c.services[domain]; !ok {
|
|
c.services[domain] = make(services)
|
|
}
|
|
if _, ok := c.ttls[domain]; !ok {
|
|
c.ttls[domain] = make(ttls)
|
|
}
|
|
|
|
c.services[domain][service] = srvs
|
|
c.ttls[domain][service] = time.Now().Add(c.opts.TTL)
|
|
}
|
|
|
|
func (c *cache) update(domain string, res *registry.Result) {
|
|
if res == nil || res.Service == nil {
|
|
return
|
|
}
|
|
|
|
// only save watched services since the service using the cache may only depend on a handful
|
|
// of other services
|
|
c.RLock()
|
|
if _, ok := c.watched[res.Service.Name]; !ok {
|
|
c.RUnlock()
|
|
return
|
|
}
|
|
|
|
// we're not going to cache anything unless there was already a lookup
|
|
services, ok := c.services[domain][res.Service.Name]
|
|
if !ok {
|
|
c.RUnlock()
|
|
return
|
|
}
|
|
|
|
c.RUnlock()
|
|
|
|
if len(res.Service.Nodes) == 0 {
|
|
switch res.Action {
|
|
case "delete":
|
|
c.del(domain, res.Service.Name)
|
|
}
|
|
return
|
|
}
|
|
|
|
// existing service found
|
|
var service *registry.Service
|
|
var index int
|
|
for i, s := range services {
|
|
if s.Version == res.Service.Version {
|
|
service = s
|
|
index = i
|
|
}
|
|
}
|
|
|
|
switch res.Action {
|
|
case "create", "update":
|
|
if service == nil {
|
|
c.set(domain, res.Service.Name, append(services, res.Service))
|
|
return
|
|
}
|
|
|
|
// append old nodes to new service
|
|
for _, cur := range service.Nodes {
|
|
var seen bool
|
|
for _, node := range res.Service.Nodes {
|
|
if cur.Id == node.Id {
|
|
seen = true
|
|
break
|
|
}
|
|
}
|
|
if !seen {
|
|
res.Service.Nodes = append(res.Service.Nodes, cur)
|
|
}
|
|
}
|
|
|
|
services[index] = res.Service
|
|
c.set(domain, res.Service.Name, services)
|
|
case "delete":
|
|
if service == nil {
|
|
return
|
|
}
|
|
|
|
var nodes []*registry.Node
|
|
|
|
// filter cur nodes to remove the dead one
|
|
for _, cur := range service.Nodes {
|
|
var seen bool
|
|
for _, del := range res.Service.Nodes {
|
|
if del.Id == cur.Id {
|
|
seen = true
|
|
break
|
|
}
|
|
}
|
|
if !seen {
|
|
nodes = append(nodes, cur)
|
|
}
|
|
}
|
|
|
|
// still got nodes, save and return
|
|
if len(nodes) > 0 {
|
|
service.Nodes = nodes
|
|
services[index] = service
|
|
c.set(domain, service.Name, services)
|
|
return
|
|
}
|
|
|
|
// zero nodes left
|
|
|
|
// only have one thing to delete
|
|
// nuke the thing
|
|
if len(services) == 1 {
|
|
c.del(domain, service.Name)
|
|
return
|
|
}
|
|
|
|
// still have more than 1 service
|
|
// check the version and keep what we know
|
|
var srvs []*registry.Service
|
|
for _, s := range services {
|
|
if s.Version != service.Version {
|
|
srvs = append(srvs, s)
|
|
}
|
|
}
|
|
|
|
// save
|
|
c.set(domain, service.Name, srvs)
|
|
}
|
|
}
|
|
|
|
// run starts the cache watcher loop
|
|
// it creates a new watcher if there's a problem
|
|
func (c *cache) run(domain string) {
|
|
c.Lock()
|
|
c.running[domain] = true
|
|
c.Unlock()
|
|
|
|
// reset watcher on exit
|
|
defer func() {
|
|
c.Lock()
|
|
c.watched[domain] = make(map[string]bool)
|
|
c.running[domain] = false
|
|
c.Unlock()
|
|
}()
|
|
|
|
var a, b int
|
|
|
|
for {
|
|
// exit early if already dead
|
|
if c.quit() {
|
|
return
|
|
}
|
|
|
|
// jitter before starting
|
|
j := rand.Int63n(100)
|
|
time.Sleep(time.Duration(j) * time.Millisecond)
|
|
|
|
// create new watcher
|
|
w, err := c.Registry.Watch(registry.WatchDomain(domain))
|
|
if err != nil {
|
|
if c.quit() {
|
|
return
|
|
}
|
|
|
|
d := backoff(a)
|
|
c.setStatus(err)
|
|
|
|
if a > 3 {
|
|
if logger.V(logger.DebugLevel, logger.DefaultLogger) {
|
|
logger.Debug("rcache: ", err, " backing off ", d)
|
|
}
|
|
a = 0
|
|
}
|
|
|
|
time.Sleep(d)
|
|
a++
|
|
|
|
continue
|
|
}
|
|
|
|
// reset a
|
|
a = 0
|
|
|
|
// watch for events
|
|
if err := c.watch(domain, w); err != nil {
|
|
if c.quit() {
|
|
return
|
|
}
|
|
|
|
d := backoff(b)
|
|
c.setStatus(err)
|
|
|
|
if b > 3 {
|
|
if logger.V(logger.DebugLevel, logger.DefaultLogger) {
|
|
logger.Debug("rcache: ", err, " backing off ", d)
|
|
}
|
|
b = 0
|
|
}
|
|
|
|
time.Sleep(d)
|
|
b++
|
|
|
|
continue
|
|
}
|
|
|
|
// reset b
|
|
b = 0
|
|
}
|
|
}
|
|
|
|
// watch loops the next event and calls update
|
|
// it returns if there's an error
|
|
func (c *cache) watch(domain string, w registry.Watcher) error {
|
|
// used to stop the watch
|
|
stop := make(chan bool)
|
|
|
|
// manage this loop
|
|
go func() {
|
|
defer w.Stop()
|
|
|
|
select {
|
|
// wait for exit
|
|
case <-c.exit:
|
|
return
|
|
// we've been stopped
|
|
case <-stop:
|
|
return
|
|
}
|
|
}()
|
|
|
|
for {
|
|
res, err := w.Next()
|
|
if err != nil {
|
|
close(stop)
|
|
return err
|
|
}
|
|
|
|
// reset the error status since we succeeded
|
|
if err := c.getStatus(); err != nil {
|
|
// reset status
|
|
c.setStatus(nil)
|
|
}
|
|
|
|
// for wildcard queries, the domain will be * and not the services domain, so we'll check to
|
|
// see if it was provided in the metadata.
|
|
dom := domain
|
|
if res.Service.Metadata != nil && len(res.Service.Metadata["domain"]) > 0 {
|
|
dom = res.Service.Metadata["domain"]
|
|
}
|
|
|
|
c.update(dom, res)
|
|
}
|
|
}
|
|
|
|
func (c *cache) GetService(service string, opts ...registry.GetOption) ([]*registry.Service, error) {
|
|
// parse the options, fallback to the default domain
|
|
var options registry.GetOptions
|
|
for _, o := range opts {
|
|
o(&options)
|
|
}
|
|
if len(options.Domain) == 0 {
|
|
options.Domain = registry.DefaultDomain
|
|
}
|
|
|
|
// get the service
|
|
services, err := c.get(options.Domain, service)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
// if there's nothing return err
|
|
if len(services) == 0 {
|
|
return nil, registry.ErrNotFound
|
|
}
|
|
|
|
// return services
|
|
return services, nil
|
|
}
|
|
|
|
func (c *cache) Stop() {
|
|
c.Lock()
|
|
defer c.Unlock()
|
|
|
|
select {
|
|
case <-c.exit:
|
|
return
|
|
default:
|
|
close(c.exit)
|
|
}
|
|
}
|
|
|
|
func (c *cache) String() string {
|
|
return "cache"
|
|
}
|
|
|
|
// New returns a new cache
|
|
func New(r registry.Registry, opts ...Option) Cache {
|
|
rand.Seed(time.Now().UnixNano())
|
|
options := Options{
|
|
TTL: defaultTTL,
|
|
}
|
|
|
|
for _, o := range opts {
|
|
o(&options)
|
|
}
|
|
|
|
return &cache{
|
|
Registry: r,
|
|
opts: options,
|
|
running: make(map[string]bool),
|
|
watched: make(map[string]watched),
|
|
services: make(map[string]services),
|
|
ttls: make(map[string]ttls),
|
|
exit: make(chan bool),
|
|
}
|
|
}
|