blob: 6ca0ea4a60b5794e00531c62b057ae86d4738976 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package xds
import (
"fmt"
"github.com/apache/dubbo-kubernetes/pkg/cluster"
"github.com/apache/dubbo-kubernetes/pkg/config/schema/kind"
"github.com/apache/dubbo-kubernetes/pkg/kube/krt"
"github.com/apache/dubbo-kubernetes/sail/pkg/features"
"github.com/apache/dubbo-kubernetes/sail/pkg/model"
discovery "github.com/envoyproxy/go-control-plane/envoy/service/discovery/v3"
"go.uber.org/atomic"
"golang.org/x/time/rate"
"google.golang.org/grpc"
"k8s.io/klog/v2"
"strconv"
"sync"
"time"
)
// DebounceOptions configures how config-change events are batched before a
// push is triggered (see the debounce function below).
type DebounceOptions struct {
	// DebounceAfter is the quiet period that must elapse after the most
	// recent config update before the pending batch is pushed.
	DebounceAfter time.Duration
	// debounceMax caps how long a batch may keep accumulating: once this
	// much time has passed since debouncing started, a push fires even if
	// updates are still arriving.
	debounceMax time.Duration
	// enableEDSDebounce controls whether non-full (EDS-only) requests are
	// debounced too; when false they are pushed immediately.
	enableEDSDebounce bool
}
// DiscoveryServer implements the ADS (Aggregated Discovery Service) gRPC
// server: it debounces inbound config updates, maintains the current
// PushContext via its Environment, and pushes xDS resources to connected
// clients.
type DiscoveryServer struct {
	// Env holds the mesh environment, including the active PushContext.
	Env *model.Environment
	// serverReady is set once all caches have synced (see CachesSynced).
	serverReady atomic.Bool
	// DiscoveryStartTime is when the process started (processStartTime);
	// used to report how long cache sync took.
	DiscoveryStartTime time.Time
	// ClusterAliases maps an alias cluster ID to the cluster ID it stands
	// for; populated from the constructor's string map.
	ClusterAliases map[cluster.ID]cluster.ID
	// pushQueue holds per-proxy pending pushes drained by sendPushes.
	pushQueue *PushQueue
	// krtDebugger is the krt debug handler supplied at construction.
	krtDebugger *krt.DebugHandler
	// InboundUpdates counts config updates received (see ConfigUpdate).
	InboundUpdates *atomic.Int64
	// CommittedUpdates counts debounced events that have been pushed.
	CommittedUpdates *atomic.Int64
	// RequestRateLimit limits inbound request handling; presumably checked
	// on the stream path — not visible in this file section.
	RequestRateLimit *rate.Limiter
	// ProxyNeedsPush decides whether (and with what request) a proxy must
	// be pushed; set elsewhere — usage not visible here.
	ProxyNeedsPush func(proxy *model.Proxy, req *model.PushRequest) (*model.PushRequest, bool)
	// pushChannel feeds raw push requests into the debounce loop.
	pushChannel chan *model.PushRequest
	// DebounceOptions controls batching of push requests.
	DebounceOptions DebounceOptions
	// concurrentPushLimit is a semaphore bounding concurrent pushes
	// (capacity features.PushThrottle).
	concurrentPushLimit chan struct{}
	// adsClientsMutex guards adsClients.
	adsClientsMutex sync.RWMutex
	// adsClients tracks connected ADS clients by connection ID.
	adsClients map[string]*Connection
	// Generators maps type URLs (or generator keys) to resource generators.
	Generators map[string]model.XdsResourceGenerator
	// pushVersion is a monotonically increasing counter for NextVersion.
	pushVersion atomic.Uint64
}
// processStartTime is captured at package init and becomes the server's
// DiscoveryStartTime, the baseline for the cache-sync duration log.
var processStartTime = time.Now()
// NewDiscoveryServer builds a DiscoveryServer wired with its push queue,
// debounce options, rate limiter, and push-throttle semaphore, all sized
// from the features package.
//
// clusterAliases maps an alias cluster name to the canonical cluster name
// it should be treated as; it is copied into typed cluster.ID keys/values.
func NewDiscoveryServer(env *model.Environment, clusterAliases map[string]string, debugger *krt.DebugHandler) *DiscoveryServer {
	out := &DiscoveryServer{
		Env:                 env,
		Generators:          map[string]model.XdsResourceGenerator{},
		krtDebugger:         debugger,
		InboundUpdates:      atomic.NewInt64(0),
		CommittedUpdates:    atomic.NewInt64(0),
		concurrentPushLimit: make(chan struct{}, features.PushThrottle),
		RequestRateLimit:    rate.NewLimiter(rate.Limit(features.RequestLimit), 1),
		pushChannel:         make(chan *model.PushRequest, 10),
		pushQueue:           NewPushQueue(),
		DebounceOptions: DebounceOptions{
			DebounceAfter:     features.DebounceAfter,
			debounceMax:       features.DebounceMax,
			enableEDSDebounce: features.EnableEDSDebounce,
		},
		adsClients:         map[string]*Connection{},
		DiscoveryStartTime: processStartTime,
	}
	// Copy the alias map into typed keys/values. Pre-size the map and use
	// the two-variable range form to avoid a second lookup per entry.
	out.ClusterAliases = make(map[cluster.ID]cluster.ID, len(clusterAliases))
	for alias, target := range clusterAliases {
		out.ClusterAliases[cluster.ID(alias)] = cluster.ID(target)
	}
	return out
}
// Register adds the ADS service implementation to the given gRPC server.
func (s *DiscoveryServer) Register(rpcs *grpc.Server) {
	// Register v3 server
	discovery.RegisterAggregatedDiscoveryServiceServer(rpcs, s)
}
// Start launches the two background loops — the update debouncer and the
// push sender — both of which run until stopCh is closed.
func (s *DiscoveryServer) Start(stopCh <-chan struct{}) {
	go s.handleUpdates(stopCh)
	go s.sendPushes(stopCh)
}
// CachesSynced marks the server ready once all caches have synced, logging
// how long the sync took since DiscoveryStartTime.
func (s *DiscoveryServer) CachesSynced() {
	elapsed := time.Since(s.DiscoveryStartTime)
	klog.Infof("All caches have been synced up in %v, marking server ready", elapsed)
	s.serverReady.Store(true)
}
// Shutdown stops the push queue, which in turn terminates the sendPushes
// loop (Dequeue reports shuttingdown).
func (s *DiscoveryServer) Shutdown() {
	s.pushQueue.ShutDown()
}
// Push dispatches a push request. Non-full (incremental) requests reuse the
// current global PushContext; full requests first build and install a fresh
// PushContext for a new version.
func (s *DiscoveryServer) Push(req *model.PushRequest) {
	// Incremental push: no full config rebuild needed, reuse the current
	// context as-is.
	if !req.Full {
		req.Push = s.globalPushContext()
		s.AdsPushAll(req)
		return
	}
	// Full push: notify the previous context of the config change so its
	// status can be reset/saved before it is replaced.
	prev := s.globalPushContext()
	if prev != nil {
		prev.OnConfigChange()
	}
	// Build the replacement context under a fresh version and push with it.
	version := s.NextVersion()
	req.Push = s.initPushContext(req, prev, version)
	s.AdsPushAll(req)
}
// initPushContext creates a new PushContext initialized from the
// environment, the previous context, and the triggering request, installs
// it as the environment's current context, and returns it.
//
// NOTE(review): the version argument is not used in this body — confirm
// whether it should be recorded on the new PushContext or dropped.
func (s *DiscoveryServer) initPushContext(req *model.PushRequest, oldPushContext *model.PushContext, version string) *model.PushContext {
	push := model.NewPushContext()
	push.InitContext(s.Env, oldPushContext, req)
	s.Env.SetPushContext(push)
	return push
}
// NextVersion returns a fresh push version string of the form
// "<RFC3339 timestamp>/<monotonic counter>".
func (s *DiscoveryServer) NextVersion() string {
	seq := s.pushVersion.Inc()
	return fmt.Sprintf("%s/%s", time.Now().Format(time.RFC3339), strconv.FormatUint(seq, 10))
}
// globalPushContext returns the environment's current PushContext.
func (s *DiscoveryServer) globalPushContext() *model.PushContext {
	return s.Env.PushContext()
}
// handleUpdates runs the debounce loop over pushChannel until stopCh
// closes, invoking s.Push for each settled batch and crediting
// CommittedUpdates with the number of events pushed.
func (s *DiscoveryServer) handleUpdates(stopCh <-chan struct{}) {
	debounce(s.pushChannel, stopCh, s.DebounceOptions, s.Push, s.CommittedUpdates)
}
// sendPushes drains the push queue until stopCh closes, bounding concurrent
// pushes with the concurrentPushLimit semaphore.
func (s *DiscoveryServer) sendPushes(stopCh <-chan struct{}) {
	doSendPushes(stopCh, s.concurrentPushLimit, s.pushQueue)
}
// ConfigUpdate records an inbound config change and enqueues it for
// debouncing. This call blocks if pushChannel's buffer is full.
func (s *DiscoveryServer) ConfigUpdate(req *model.PushRequest) {
	if model.HasConfigsOfKind(req.ConfigsUpdated, kind.Address) {
		// TODO ClearAll
	}
	s.InboundUpdates.Inc()
	s.pushChannel <- req
}
// IsServerReady reports whether CachesSynced has marked the server ready.
func (s *DiscoveryServer) IsServerReady() bool {
	return s.serverReady.Load()
}
// reasonsUpdated renders a short human-readable summary of the request's
// trigger reasons for logging: up to two reasons are named, and any extras
// are summarized as a count. Which reasons are named is arbitrary (map
// iteration order).
func reasonsUpdated(req *model.PushRequest) string {
	type reasonCount struct {
		reason model.TriggerReason
		count  int
	}
	// Grab the first two entries the map happens to yield.
	var sampled []reasonCount
	for r, cnt := range req.Reason {
		sampled = append(sampled, reasonCount{r, cnt})
		if len(sampled) == 2 {
			break
		}
	}
	switch len(req.Reason) {
	case 0:
		return "unknown"
	case 1:
		return fmt.Sprintf("%s:%d", sampled[0].reason, sampled[0].count)
	case 2:
		return fmt.Sprintf("%s:%d and %s:%d", sampled[0].reason, sampled[0].count, sampled[1].reason, sampled[1].count)
	default:
		return fmt.Sprintf("%s:%d and %d(%d) more reasons", sampled[0].reason, sampled[0].count,
			len(req.Reason)-1, req.Reason.Count()-sampled[0].count)
	}
}
// configsUpdated renders a short log summary of the updated configs: one
// arbitrary config key (map iteration order), plus a count of the rest.
func configsUpdated(req *model.PushRequest) string {
	var configs string
	// Pick whichever key the map yields first.
	for key := range req.ConfigsUpdated {
		configs = key.String()
		break
	}
	if extra := len(req.ConfigsUpdated) - 1; extra > 0 {
		configs += " and " + strconv.Itoa(extra) + " more configs"
	}
	return configs
}
// debounce batches push requests read from ch and calls pushFn once the
// stream has been quiet for opts.DebounceAfter, or once opts.debounceMax
// has elapsed since the batch started. At most one push runs at a time;
// requests arriving while a push is in flight keep merging into the next
// batch. updateSent is credited with the number of events folded into each
// completed push. Returns when stopCh is closed.
func debounce(ch chan *model.PushRequest, stopCh <-chan struct{}, opts DebounceOptions, pushFn func(req *model.PushRequest), updateSent *atomic.Int64) {
	var timeChan <-chan time.Time
	// startDebounce marks when the current batch began accumulating.
	var startDebounce time.Time
	// lastConfigUpdateTime is the arrival time of the most recent event.
	var lastConfigUpdateTime time.Time
	pushCounter := 0
	// debouncedEvents counts events merged into the pending request.
	debouncedEvents := 0
	// req is the pending merged request; nil when no batch is waiting.
	var req *model.PushRequest
	// free is true when no push is currently in flight.
	free := true
	freeCh := make(chan struct{}, 1)
	// push runs the actual push and signals completion via freeCh.
	push := func(req *model.PushRequest, debouncedEvents int, startDebounce time.Time) {
		pushFn(req)
		updateSent.Add(int64(debouncedEvents))
		freeCh <- struct{}{}
	}
	// pushWorker fires the pending batch if either threshold is met;
	// otherwise it re-arms the timer for the remaining quiet time.
	pushWorker := func() {
		eventDelay := time.Since(startDebounce)
		quietTime := time.Since(lastConfigUpdateTime)
		// it has been too long or quiet enough
		if eventDelay >= opts.debounceMax || quietTime >= opts.DebounceAfter {
			if req != nil {
				pushCounter++
				if req.ConfigsUpdated == nil {
					klog.Infof("Push debounce stable[%d] %d for reason %s: %v since last change, %v since last push, full=%v",
						pushCounter, debouncedEvents, reasonsUpdated(req),
						quietTime, eventDelay, req.Full)
				} else {
					klog.Infof("Push debounce stable[%d] %d for config %s: %v since last change, %v since last push, full=%v",
						pushCounter, debouncedEvents, configsUpdated(req),
						quietTime, eventDelay, req.Full)
				}
				// Hand the batch to a goroutine and reset accumulation
				// state so the next batch starts fresh.
				free = false
				go push(req, debouncedEvents, startDebounce)
				req = nil
				debouncedEvents = 0
			}
		} else {
			timeChan = time.After(opts.DebounceAfter - quietTime)
		}
	}
	for {
		select {
		case <-freeCh:
			// A push finished; immediately check whether another batch
			// accumulated in the meantime and is ready to go.
			free = true
			pushWorker()
		case r := <-ch:
			// If reason is not set, record it as an unknown reason
			if len(r.Reason) == 0 {
				r.Reason = model.NewReasonStats(model.UnknownTrigger)
			}
			if !opts.enableEDSDebounce && !r.Full {
				// trigger push now, just for EDS
				go func(req *model.PushRequest) {
					pushFn(req)
					updateSent.Inc()
				}(r)
				continue
			}
			lastConfigUpdateTime = time.Now()
			// First event of a new batch: arm the quiet timer and record
			// the batch start time for the debounceMax check.
			if debouncedEvents == 0 {
				timeChan = time.After(opts.DebounceAfter)
				startDebounce = lastConfigUpdateTime
			}
			debouncedEvents++
			req = req.Merge(r)
		case <-timeChan:
			// Timer fired; only push if no other push is in flight —
			// otherwise freeCh will re-trigger pushWorker on completion.
			if free {
				pushWorker()
			}
		case <-stopCh:
			return
		}
	}
}
// doSendPushes loops dequeuing proxies from the push queue and delivering a
// push event to each one, bounding concurrent pushes with semaphore.
// Returns when stopCh closes or the queue is shut down.
func doSendPushes(stopCh <-chan struct{}, semaphore chan struct{}, queue *PushQueue) {
	for {
		select {
		case <-stopCh:
			return
		default:
			// Acquire a semaphore slot before dequeuing so Dequeue (which
			// blocks while the queue is empty) only proceeds when a push
			// can actually run.
			semaphore <- struct{}{}
			// Get the next proxy to push. This will block if there are no updates required.
			client, push, shuttingdown := queue.Dequeue()
			if shuttingdown {
				return
			}
			// doneFunc releases both the queue's in-progress marker and
			// the semaphore slot once the push completes.
			doneFunc := func() {
				queue.MarkDone(client)
				<-semaphore
			}
			// Pick the appropriate stream-closed signal: delta stream if
			// present, otherwise the SotW stream's done channel.
			var closed <-chan struct{}
			if client.deltaStream != nil {
				closed = client.deltaStream.Context().Done()
			} else {
				closed = client.StreamDone()
			}
			// Deliver the event asynchronously; if the client disconnects
			// before accepting it, release resources via doneFunc.
			go func() {
				pushEv := &Event{
					pushRequest: push,
					done:        doneFunc,
				}
				select {
				case client.PushCh() <- pushEv:
					return
				case <-closed: // grpc stream was closed
					doneFunc()
					klog.Infof("Client closed connection %v", client.ID())
				}
			}()
		}
	}
}