12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902 |
- /*
- Copyright 2014 The Kubernetes Authors.
- Licensed under the Apache License, Version 2.0 (the "License");
- you may not use this file except in compliance with the License.
- You may obtain a copy of the License at
- http://www.apache.org/licenses/LICENSE-2.0
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
- */
- package cache
- import (
- "context"
- "errors"
- "fmt"
- "io"
- "math/rand"
- "os"
- "reflect"
- "strings"
- "sync"
- "time"
- apierrors "k8s.io/apimachinery/pkg/api/errors"
- "k8s.io/apimachinery/pkg/api/meta"
- metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
- "k8s.io/apimachinery/pkg/apis/meta/v1/unstructured"
- "k8s.io/apimachinery/pkg/runtime"
- "k8s.io/apimachinery/pkg/runtime/schema"
- "k8s.io/apimachinery/pkg/util/naming"
- utilnet "k8s.io/apimachinery/pkg/util/net"
- utilruntime "k8s.io/apimachinery/pkg/util/runtime"
- "k8s.io/apimachinery/pkg/util/wait"
- "k8s.io/apimachinery/pkg/watch"
- "k8s.io/client-go/tools/pager"
- "k8s.io/klog/v2"
- "k8s.io/utils/clock"
- "k8s.io/utils/pointer"
- "k8s.io/utils/trace"
- )
const (
	// defaultExpectedTypeName is the type description reported for a
	// reflector that was created without an expected type.
	defaultExpectedTypeName = "<unspecified>"
)
- // Reflector watches a specified resource and causes all changes to be reflected in the given store.
- type Reflector struct {
- // name identifies this reflector. By default it will be a file:line if possible.
- name string
- // The name of the type we expect to place in the store. The name
- // will be the stringification of expectedGVK if provided, and the
- // stringification of expectedType otherwise. It is for display
- // only, and should not be used for parsing or comparison.
- typeDescription string
- // An example object of the type we expect to place in the store.
- // Only the type needs to be right, except that when that is
- // `unstructured.Unstructured` the object's `"apiVersion"` and
- // `"kind"` must also be right.
- expectedType reflect.Type
- // The GVK of the object we expect to place in the store if unstructured.
- expectedGVK *schema.GroupVersionKind
- // The destination to sync up with the watch source
- store Store
- // listerWatcher is used to perform lists and watches.
- listerWatcher ListerWatcher
- // backoff manages backoff of ListWatch
- backoffManager wait.BackoffManager
- resyncPeriod time.Duration
- // clock allows tests to manipulate time
- clock clock.Clock
- // paginatedResult defines whether pagination should be forced for list calls.
- // It is set based on the result of the initial list call.
- paginatedResult bool
- // lastSyncResourceVersion is the resource version token last
- // observed when doing a sync with the underlying store
- // it is thread safe, but not synchronized with the underlying store
- lastSyncResourceVersion string
- // isLastSyncResourceVersionUnavailable is true if the previous list or watch request with
- // lastSyncResourceVersion failed with an "expired" or "too large resource version" error.
- isLastSyncResourceVersionUnavailable bool
- // lastSyncResourceVersionMutex guards read/write access to lastSyncResourceVersion
- lastSyncResourceVersionMutex sync.RWMutex
- // Called whenever the ListAndWatch drops the connection with an error.
- watchErrorHandler WatchErrorHandler
- // WatchListPageSize is the requested chunk size of initial and resync watch lists.
- // If unset, for consistent reads (RV="") or reads that opt-into arbitrarily old data
- // (RV="0") it will default to pager.PageSize, for the rest (RV != "" && RV != "0")
- // it will turn off pagination to allow serving them from watch cache.
- // NOTE: It should be used carefully as paginated lists are always served directly from
- // etcd, which is significantly less efficient and may lead to serious performance and
- // scalability problems.
- WatchListPageSize int64
- // ShouldResync is invoked periodically and whenever it returns `true` the Store's Resync operation is invoked
- ShouldResync func() bool
- // MaxInternalErrorRetryDuration defines how long we should retry internal errors returned by watch.
- MaxInternalErrorRetryDuration time.Duration
- // UseWatchList if turned on instructs the reflector to open a stream to bring data from the API server.
- // Streaming has the primary advantage of using fewer server's resources to fetch data.
- //
- // The old behaviour establishes a LIST request which gets data in chunks.
- // Paginated list is less efficient and depending on the actual size of objects
- // might result in an increased memory consumption of the APIServer.
- //
- // See https://github.com/kubernetes/enhancements/tree/master/keps/sig-api-machinery/3157-watch-list#design-details
- UseWatchList bool
- }
// ResourceVersionUpdater may be implemented by a store that wants to follow
// the reflector's current resource version. This matters most when storage
// bookmarks are enabled.
type ResourceVersionUpdater interface {
	// UpdateResourceVersion is invoked every time the reflector's current
	// resource version changes.
	UpdateResourceVersion(resourceVersion string)
}
- // The WatchErrorHandler is called whenever ListAndWatch drops the
- // connection with an error. After calling this handler, the informer
- // will backoff and retry.
- //
- // The default implementation looks at the error type and tries to log
- // the error message at an appropriate level.
- //
- // Implementations of this handler may display the error message in other
- // ways. Implementations should return quickly - any expensive processing
- // should be offloaded.
- type WatchErrorHandler func(r *Reflector, err error)
- // DefaultWatchErrorHandler is the default implementation of WatchErrorHandler
- func DefaultWatchErrorHandler(r *Reflector, err error) {
- switch {
- case isExpiredError(err):
- // Don't set LastSyncResourceVersionUnavailable - LIST call with ResourceVersion=RV already
- // has a semantic that it returns data at least as fresh as provided RV.
- // So first try to LIST with setting RV to resource version of last observed object.
- klog.V(4).Infof("%s: watch of %v closed with: %v", r.name, r.typeDescription, err)
- case err == io.EOF:
- // watch closed normally
- case err == io.ErrUnexpectedEOF:
- klog.V(1).Infof("%s: Watch for %v closed with unexpected EOF: %v", r.name, r.typeDescription, err)
- default:
- utilruntime.HandleError(fmt.Errorf("%s: Failed to watch %v: %v", r.name, r.typeDescription, err))
- }
- }
// minWatchTimeout is the lower bound of the timeout attached to watch
// requests. To spread load on the apiserver each request picks a random
// timeout in [minWatchTimeout, 2*minWatchTimeout].
var minWatchTimeout = 5 * time.Minute
- // NewNamespaceKeyedIndexerAndReflector creates an Indexer and a Reflector
- // The indexer is configured to key on namespace
- func NewNamespaceKeyedIndexerAndReflector(lw ListerWatcher, expectedType interface{}, resyncPeriod time.Duration) (indexer Indexer, reflector *Reflector) {
- indexer = NewIndexer(MetaNamespaceKeyFunc, Indexers{NamespaceIndex: MetaNamespaceIndexFunc})
- reflector = NewReflector(lw, expectedType, indexer, resyncPeriod)
- return indexer, reflector
- }
- // NewReflector creates a new Reflector with its name defaulted to the closest source_file.go:line in the call stack
- // that is outside this package. See NewReflectorWithOptions for further information.
- func NewReflector(lw ListerWatcher, expectedType interface{}, store Store, resyncPeriod time.Duration) *Reflector {
- return NewReflectorWithOptions(lw, expectedType, store, ReflectorOptions{ResyncPeriod: resyncPeriod})
- }
- // NewNamedReflector creates a new Reflector with the specified name. See NewReflectorWithOptions for further
- // information.
- func NewNamedReflector(name string, lw ListerWatcher, expectedType interface{}, store Store, resyncPeriod time.Duration) *Reflector {
- return NewReflectorWithOptions(lw, expectedType, store, ReflectorOptions{Name: name, ResyncPeriod: resyncPeriod})
- }
- // ReflectorOptions configures a Reflector.
- type ReflectorOptions struct {
- // Name is the Reflector's name. If unset/unspecified, the name defaults to the closest source_file.go:line
- // in the call stack that is outside this package.
- Name string
- // TypeDescription is the Reflector's type description. If unset/unspecified, the type description is defaulted
- // using the following rules: if the expectedType passed to NewReflectorWithOptions was nil, the type description is
- // "<unspecified>". If the expectedType is an instance of *unstructured.Unstructured and its apiVersion and kind fields
- // are set, the type description is the string encoding of those. Otherwise, the type description is set to the
- // go type of expectedType..
- TypeDescription string
- // ResyncPeriod is the Reflector's resync period. If unset/unspecified, the resync period defaults to 0
- // (do not resync).
- ResyncPeriod time.Duration
- // Clock allows tests to control time. If unset defaults to clock.RealClock{}
- Clock clock.Clock
- }
- // NewReflectorWithOptions creates a new Reflector object which will keep the
- // given store up to date with the server's contents for the given
- // resource. Reflector promises to only put things in the store that
- // have the type of expectedType, unless expectedType is nil. If
- // resyncPeriod is non-zero, then the reflector will periodically
- // consult its ShouldResync function to determine whether to invoke
- // the Store's Resync operation; `ShouldResync==nil` means always
- // "yes". This enables you to use reflectors to periodically process
- // everything as well as incrementally processing the things that
- // change.
- func NewReflectorWithOptions(lw ListerWatcher, expectedType interface{}, store Store, options ReflectorOptions) *Reflector {
- reflectorClock := options.Clock
- if reflectorClock == nil {
- reflectorClock = clock.RealClock{}
- }
- r := &Reflector{
- name: options.Name,
- resyncPeriod: options.ResyncPeriod,
- typeDescription: options.TypeDescription,
- listerWatcher: lw,
- store: store,
- // We used to make the call every 1sec (1 QPS), the goal here is to achieve ~98% traffic reduction when
- // API server is not healthy. With these parameters, backoff will stop at [30,60) sec interval which is
- // 0.22 QPS. If we don't backoff for 2min, assume API server is healthy and we reset the backoff.
- backoffManager: wait.NewExponentialBackoffManager(800*time.Millisecond, 30*time.Second, 2*time.Minute, 2.0, 1.0, reflectorClock),
- clock: reflectorClock,
- watchErrorHandler: WatchErrorHandler(DefaultWatchErrorHandler),
- expectedType: reflect.TypeOf(expectedType),
- }
- if r.name == "" {
- r.name = naming.GetNameFromCallsite(internalPackages...)
- }
- if r.typeDescription == "" {
- r.typeDescription = getTypeDescriptionFromObject(expectedType)
- }
- if r.expectedGVK == nil {
- r.expectedGVK = getExpectedGVKFromObject(expectedType)
- }
- if s := os.Getenv("ENABLE_CLIENT_GO_WATCH_LIST_ALPHA"); len(s) > 0 {
- r.UseWatchList = true
- }
- return r
- }
- func getTypeDescriptionFromObject(expectedType interface{}) string {
- if expectedType == nil {
- return defaultExpectedTypeName
- }
- reflectDescription := reflect.TypeOf(expectedType).String()
- obj, ok := expectedType.(*unstructured.Unstructured)
- if !ok {
- return reflectDescription
- }
- gvk := obj.GroupVersionKind()
- if gvk.Empty() {
- return reflectDescription
- }
- return gvk.String()
- }
- func getExpectedGVKFromObject(expectedType interface{}) *schema.GroupVersionKind {
- obj, ok := expectedType.(*unstructured.Unstructured)
- if !ok {
- return nil
- }
- gvk := obj.GroupVersionKind()
- if gvk.Empty() {
- return nil
- }
- return &gvk
- }
// internalPackages lists the packages that are skipped when deriving a
// default reflector name from the call stack. They sit on the common call
// chains to NewReflector and would therefore make low entropy names.
var internalPackages = []string{
	"client-go/tools/cache/",
}
- // Run repeatedly uses the reflector's ListAndWatch to fetch all the
- // objects and subsequent deltas.
- // Run will exit when stopCh is closed.
- func (r *Reflector) Run(stopCh <-chan struct{}) {
- klog.V(3).Infof("Starting reflector %s (%s) from %s", r.typeDescription, r.resyncPeriod, r.name)
- wait.BackoffUntil(func() {
- if err := r.ListAndWatch(stopCh); err != nil {
- r.watchErrorHandler(r, err)
- }
- }, r.backoffManager, true, stopCh)
- klog.V(3).Infof("Stopping reflector %s (%s) from %s", r.typeDescription, r.resyncPeriod, r.name)
- }
// neverExitWatch is a channel on which nothing is ever sent.
var neverExitWatch <-chan time.Time = make(chan time.Time)

// errorStopRequested reports that watching stopped because the stop channel
// supplied by a client of the reflector was signalled.
var errorStopRequested = errors.New("stop requested")
- // resyncChan returns a channel which will receive something when a resync is
- // required, and a cleanup function.
- func (r *Reflector) resyncChan() (<-chan time.Time, func() bool) {
- if r.resyncPeriod == 0 {
- return neverExitWatch, func() bool { return false }
- }
- // The cleanup function is required: imagine the scenario where watches
- // always fail so we end up listing frequently. Then, if we don't
- // manually stop the timer, we could end up with many timers active
- // concurrently.
- t := r.clock.NewTimer(r.resyncPeriod)
- return t.C(), t.Stop
- }
- // ListAndWatch first lists all items and get the resource version at the moment of call,
- // and then use the resource version to watch.
- // It returns error if ListAndWatch didn't even try to initialize watch.
- func (r *Reflector) ListAndWatch(stopCh <-chan struct{}) error {
- klog.V(3).Infof("Listing and watching %v from %s", r.typeDescription, r.name)
- var err error
- var w watch.Interface
- fallbackToList := !r.UseWatchList
- if r.UseWatchList {
- w, err = r.watchList(stopCh)
- if w == nil && err == nil {
- // stopCh was closed
- return nil
- }
- if err != nil {
- if !apierrors.IsInvalid(err) {
- return err
- }
- klog.Warning("the watch-list feature is not supported by the server, falling back to the previous LIST/WATCH semantic")
- fallbackToList = true
- // Ensure that we won't accidentally pass some garbage down the watch.
- w = nil
- }
- }
- if fallbackToList {
- err = r.list(stopCh)
- if err != nil {
- return err
- }
- }
- resyncerrc := make(chan error, 1)
- cancelCh := make(chan struct{})
- defer close(cancelCh)
- go r.startResync(stopCh, cancelCh, resyncerrc)
- return r.watch(w, stopCh, resyncerrc)
- }
- // startResync periodically calls r.store.Resync() method.
- // Note that this method is blocking and should be
- // called in a separate goroutine.
- func (r *Reflector) startResync(stopCh <-chan struct{}, cancelCh <-chan struct{}, resyncerrc chan error) {
- resyncCh, cleanup := r.resyncChan()
- defer func() {
- cleanup() // Call the last one written into cleanup
- }()
- for {
- select {
- case <-resyncCh:
- case <-stopCh:
- return
- case <-cancelCh:
- return
- }
- if r.ShouldResync == nil || r.ShouldResync() {
- klog.V(4).Infof("%s: forcing resync", r.name)
- if err := r.store.Resync(); err != nil {
- resyncerrc <- err
- return
- }
- }
- cleanup()
- resyncCh, cleanup = r.resyncChan()
- }
- }
- // watch simply starts a watch request with the server.
- func (r *Reflector) watch(w watch.Interface, stopCh <-chan struct{}, resyncerrc chan error) error {
- var err error
- retry := NewRetryWithDeadline(r.MaxInternalErrorRetryDuration, time.Minute, apierrors.IsInternalError, r.clock)
- for {
- // give the stopCh a chance to stop the loop, even in case of continue statements further down on errors
- select {
- case <-stopCh:
- return nil
- default:
- }
- // start the clock before sending the request, since some proxies won't flush headers until after the first watch event is sent
- start := r.clock.Now()
- if w == nil {
- timeoutSeconds := int64(minWatchTimeout.Seconds() * (rand.Float64() + 1.0))
- options := metav1.ListOptions{
- ResourceVersion: r.LastSyncResourceVersion(),
- // We want to avoid situations of hanging watchers. Stop any watchers that do not
- // receive any events within the timeout window.
- TimeoutSeconds: &timeoutSeconds,
- // To reduce load on kube-apiserver on watch restarts, you may enable watch bookmarks.
- // Reflector doesn't assume bookmarks are returned at all (if the server do not support
- // watch bookmarks, it will ignore this field).
- AllowWatchBookmarks: true,
- }
- w, err = r.listerWatcher.Watch(options)
- if err != nil {
- if canRetry := isWatchErrorRetriable(err); canRetry {
- klog.V(4).Infof("%s: watch of %v returned %v - backing off", r.name, r.typeDescription, err)
- select {
- case <-stopCh:
- return nil
- case <-r.backoffManager.Backoff().C():
- continue
- }
- }
- return err
- }
- }
- err = watchHandler(start, w, r.store, r.expectedType, r.expectedGVK, r.name, r.typeDescription, r.setLastSyncResourceVersion, nil, r.clock, resyncerrc, stopCh)
- // Ensure that watch will not be reused across iterations.
- w.Stop()
- w = nil
- retry.After(err)
- if err != nil {
- if err != errorStopRequested {
- switch {
- case isExpiredError(err):
- // Don't set LastSyncResourceVersionUnavailable - LIST call with ResourceVersion=RV already
- // has a semantic that it returns data at least as fresh as provided RV.
- // So first try to LIST with setting RV to resource version of last observed object.
- klog.V(4).Infof("%s: watch of %v closed with: %v", r.name, r.typeDescription, err)
- case apierrors.IsTooManyRequests(err):
- klog.V(2).Infof("%s: watch of %v returned 429 - backing off", r.name, r.typeDescription)
- select {
- case <-stopCh:
- return nil
- case <-r.backoffManager.Backoff().C():
- continue
- }
- case apierrors.IsInternalError(err) && retry.ShouldRetry():
- klog.V(2).Infof("%s: retrying watch of %v internal error: %v", r.name, r.typeDescription, err)
- continue
- default:
- klog.Warningf("%s: watch of %v ended with: %v", r.name, r.typeDescription, err)
- }
- }
- return nil
- }
- }
- }
- // list simply lists all items and records a resource version obtained from the server at the moment of the call.
- // the resource version can be used for further progress notification (aka. watch).
- func (r *Reflector) list(stopCh <-chan struct{}) error {
- var resourceVersion string
- options := metav1.ListOptions{ResourceVersion: r.relistResourceVersion()}
- initTrace := trace.New("Reflector ListAndWatch", trace.Field{Key: "name", Value: r.name})
- defer initTrace.LogIfLong(10 * time.Second)
- var list runtime.Object
- var paginatedResult bool
- var err error
- listCh := make(chan struct{}, 1)
- panicCh := make(chan interface{}, 1)
- go func() {
- defer func() {
- if r := recover(); r != nil {
- panicCh <- r
- }
- }()
- // Attempt to gather list in chunks, if supported by listerWatcher, if not, the first
- // list request will return the full response.
- pager := pager.New(pager.SimplePageFunc(func(opts metav1.ListOptions) (runtime.Object, error) {
- return r.listerWatcher.List(opts)
- }))
- switch {
- case r.WatchListPageSize != 0:
- pager.PageSize = r.WatchListPageSize
- case r.paginatedResult:
- // We got a paginated result initially. Assume this resource and server honor
- // paging requests (i.e. watch cache is probably disabled) and leave the default
- // pager size set.
- case options.ResourceVersion != "" && options.ResourceVersion != "0":
- // User didn't explicitly request pagination.
- //
- // With ResourceVersion != "", we have a possibility to list from watch cache,
- // but we do that (for ResourceVersion != "0") only if Limit is unset.
- // To avoid thundering herd on etcd (e.g. on master upgrades), we explicitly
- // switch off pagination to force listing from watch cache (if enabled).
- // With the existing semantic of RV (result is at least as fresh as provided RV),
- // this is correct and doesn't lead to going back in time.
- //
- // We also don't turn off pagination for ResourceVersion="0", since watch cache
- // is ignoring Limit in that case anyway, and if watch cache is not enabled
- // we don't introduce regression.
- pager.PageSize = 0
- }
- list, paginatedResult, err = pager.ListWithAlloc(context.Background(), options)
- if isExpiredError(err) || isTooLargeResourceVersionError(err) {
- r.setIsLastSyncResourceVersionUnavailable(true)
- // Retry immediately if the resource version used to list is unavailable.
- // The pager already falls back to full list if paginated list calls fail due to an "Expired" error on
- // continuation pages, but the pager might not be enabled, the full list might fail because the
- // resource version it is listing at is expired or the cache may not yet be synced to the provided
- // resource version. So we need to fallback to resourceVersion="" in all to recover and ensure
- // the reflector makes forward progress.
- list, paginatedResult, err = pager.ListWithAlloc(context.Background(), metav1.ListOptions{ResourceVersion: r.relistResourceVersion()})
- }
- close(listCh)
- }()
- select {
- case <-stopCh:
- return nil
- case r := <-panicCh:
- panic(r)
- case <-listCh:
- }
- initTrace.Step("Objects listed", trace.Field{Key: "error", Value: err})
- if err != nil {
- klog.Warningf("%s: failed to list %v: %v", r.name, r.typeDescription, err)
- return fmt.Errorf("failed to list %v: %w", r.typeDescription, err)
- }
- // We check if the list was paginated and if so set the paginatedResult based on that.
- // However, we want to do that only for the initial list (which is the only case
- // when we set ResourceVersion="0"). The reasoning behind it is that later, in some
- // situations we may force listing directly from etcd (by setting ResourceVersion="")
- // which will return paginated result, even if watch cache is enabled. However, in
- // that case, we still want to prefer sending requests to watch cache if possible.
- //
- // Paginated result returned for request with ResourceVersion="0" mean that watch
- // cache is disabled and there are a lot of objects of a given type. In such case,
- // there is no need to prefer listing from watch cache.
- if options.ResourceVersion == "0" && paginatedResult {
- r.paginatedResult = true
- }
- r.setIsLastSyncResourceVersionUnavailable(false) // list was successful
- listMetaInterface, err := meta.ListAccessor(list)
- if err != nil {
- return fmt.Errorf("unable to understand list result %#v: %v", list, err)
- }
- resourceVersion = listMetaInterface.GetResourceVersion()
- initTrace.Step("Resource version extracted")
- items, err := meta.ExtractListWithAlloc(list)
- if err != nil {
- return fmt.Errorf("unable to understand list result %#v (%v)", list, err)
- }
- initTrace.Step("Objects extracted")
- if err := r.syncWith(items, resourceVersion); err != nil {
- return fmt.Errorf("unable to sync list result: %v", err)
- }
- initTrace.Step("SyncWith done")
- r.setLastSyncResourceVersion(resourceVersion)
- initTrace.Step("Resource version updated")
- return nil
- }
- // watchList establishes a stream to get a consistent snapshot of data
- // from the server as described in https://github.com/kubernetes/enhancements/tree/master/keps/sig-api-machinery/3157-watch-list#proposal
- //
- // case 1: start at Most Recent (RV="", ResourceVersionMatch=ResourceVersionMatchNotOlderThan)
- // Establishes a consistent stream with the server.
- // That means the returned data is consistent, as if, served directly from etcd via a quorum read.
- // It begins with synthetic "Added" events of all resources up to the most recent ResourceVersion.
- // It ends with a synthetic "Bookmark" event containing the most recent ResourceVersion.
- // After receiving a "Bookmark" event the reflector is considered to be synchronized.
- // It replaces its internal store with the collected items and
- // reuses the current watch requests for getting further events.
- //
- // case 2: start at Exact (RV>"0", ResourceVersionMatch=ResourceVersionMatchNotOlderThan)
- // Establishes a stream with the server at the provided resource version.
- // To establish the initial state the server begins with synthetic "Added" events.
- // It ends with a synthetic "Bookmark" event containing the provided or newer resource version.
- // After receiving a "Bookmark" event the reflector is considered to be synchronized.
- // It replaces its internal store with the collected items and
- // reuses the current watch requests for getting further events.
- func (r *Reflector) watchList(stopCh <-chan struct{}) (watch.Interface, error) {
- var w watch.Interface
- var err error
- var temporaryStore Store
- var resourceVersion string
- // TODO(#115478): see if this function could be turned
- // into a method and see if error handling
- // could be unified with the r.watch method
- isErrorRetriableWithSideEffectsFn := func(err error) bool {
- if canRetry := isWatchErrorRetriable(err); canRetry {
- klog.V(2).Infof("%s: watch-list of %v returned %v - backing off", r.name, r.typeDescription, err)
- <-r.backoffManager.Backoff().C()
- return true
- }
- if isExpiredError(err) || isTooLargeResourceVersionError(err) {
- // we tried to re-establish a watch request but the provided RV
- // has either expired or it is greater than the server knows about.
- // In that case we reset the RV and
- // try to get a consistent snapshot from the watch cache (case 1)
- r.setIsLastSyncResourceVersionUnavailable(true)
- return true
- }
- return false
- }
- initTrace := trace.New("Reflector WatchList", trace.Field{Key: "name", Value: r.name})
- defer initTrace.LogIfLong(10 * time.Second)
- for {
- select {
- case <-stopCh:
- return nil, nil
- default:
- }
- resourceVersion = ""
- lastKnownRV := r.rewatchResourceVersion()
- temporaryStore = NewStore(DeletionHandlingMetaNamespaceKeyFunc)
- // TODO(#115478): large "list", slow clients, slow network, p&f
- // might slow down streaming and eventually fail.
- // maybe in such a case we should retry with an increased timeout?
- timeoutSeconds := int64(minWatchTimeout.Seconds() * (rand.Float64() + 1.0))
- options := metav1.ListOptions{
- ResourceVersion: lastKnownRV,
- AllowWatchBookmarks: true,
- SendInitialEvents: pointer.Bool(true),
- ResourceVersionMatch: metav1.ResourceVersionMatchNotOlderThan,
- TimeoutSeconds: &timeoutSeconds,
- }
- start := r.clock.Now()
- w, err = r.listerWatcher.Watch(options)
- if err != nil {
- if isErrorRetriableWithSideEffectsFn(err) {
- continue
- }
- return nil, err
- }
- bookmarkReceived := pointer.Bool(false)
- err = watchHandler(start, w, temporaryStore, r.expectedType, r.expectedGVK, r.name, r.typeDescription,
- func(rv string) { resourceVersion = rv },
- bookmarkReceived,
- r.clock, make(chan error), stopCh)
- if err != nil {
- w.Stop() // stop and retry with clean state
- if err == errorStopRequested {
- return nil, nil
- }
- if isErrorRetriableWithSideEffectsFn(err) {
- continue
- }
- return nil, err
- }
- if *bookmarkReceived {
- break
- }
- }
- // We successfully got initial state from watch-list confirmed by the
- // "k8s.io/initial-events-end" bookmark.
- initTrace.Step("Objects streamed", trace.Field{Key: "count", Value: len(temporaryStore.List())})
- r.setIsLastSyncResourceVersionUnavailable(false)
- if err = r.store.Replace(temporaryStore.List(), resourceVersion); err != nil {
- return nil, fmt.Errorf("unable to sync watch-list result: %v", err)
- }
- initTrace.Step("SyncWith done")
- r.setLastSyncResourceVersion(resourceVersion)
- return w, nil
- }
- // syncWith replaces the store's items with the given list.
- func (r *Reflector) syncWith(items []runtime.Object, resourceVersion string) error {
- found := make([]interface{}, 0, len(items))
- for _, item := range items {
- found = append(found, item)
- }
- return r.store.Replace(found, resourceVersion)
- }
- // watchHandler watches w and sets setLastSyncResourceVersion
- func watchHandler(start time.Time,
- w watch.Interface,
- store Store,
- expectedType reflect.Type,
- expectedGVK *schema.GroupVersionKind,
- name string,
- expectedTypeName string,
- setLastSyncResourceVersion func(string),
- exitOnInitialEventsEndBookmark *bool,
- clock clock.Clock,
- errc chan error,
- stopCh <-chan struct{},
- ) error {
- eventCount := 0
- if exitOnInitialEventsEndBookmark != nil {
- // set it to false just in case somebody
- // made it positive
- *exitOnInitialEventsEndBookmark = false
- }
- loop:
- for {
- select {
- case <-stopCh:
- return errorStopRequested
- case err := <-errc:
- return err
- case event, ok := <-w.ResultChan():
- if !ok {
- break loop
- }
- if event.Type == watch.Error {
- return apierrors.FromObject(event.Object)
- }
- if expectedType != nil {
- if e, a := expectedType, reflect.TypeOf(event.Object); e != a {
- utilruntime.HandleError(fmt.Errorf("%s: expected type %v, but watch event object had type %v", name, e, a))
- continue
- }
- }
- if expectedGVK != nil {
- if e, a := *expectedGVK, event.Object.GetObjectKind().GroupVersionKind(); e != a {
- utilruntime.HandleError(fmt.Errorf("%s: expected gvk %v, but watch event object had gvk %v", name, e, a))
- continue
- }
- }
- meta, err := meta.Accessor(event.Object)
- if err != nil {
- utilruntime.HandleError(fmt.Errorf("%s: unable to understand watch event %#v", name, event))
- continue
- }
- resourceVersion := meta.GetResourceVersion()
- switch event.Type {
- case watch.Added:
- err := store.Add(event.Object)
- if err != nil {
- utilruntime.HandleError(fmt.Errorf("%s: unable to add watch event object (%#v) to store: %v", name, event.Object, err))
- }
- case watch.Modified:
- err := store.Update(event.Object)
- if err != nil {
- utilruntime.HandleError(fmt.Errorf("%s: unable to update watch event object (%#v) to store: %v", name, event.Object, err))
- }
- case watch.Deleted:
- // TODO: Will any consumers need access to the "last known
- // state", which is passed in event.Object? If so, may need
- // to change this.
- err := store.Delete(event.Object)
- if err != nil {
- utilruntime.HandleError(fmt.Errorf("%s: unable to delete watch event object (%#v) from store: %v", name, event.Object, err))
- }
- case watch.Bookmark:
- // A `Bookmark` means watch has synced here, just update the resourceVersion
- if _, ok := meta.GetAnnotations()["k8s.io/initial-events-end"]; ok {
- if exitOnInitialEventsEndBookmark != nil {
- *exitOnInitialEventsEndBookmark = true
- }
- }
- default:
- utilruntime.HandleError(fmt.Errorf("%s: unable to understand watch event %#v", name, event))
- }
- setLastSyncResourceVersion(resourceVersion)
- if rvu, ok := store.(ResourceVersionUpdater); ok {
- rvu.UpdateResourceVersion(resourceVersion)
- }
- eventCount++
- if exitOnInitialEventsEndBookmark != nil && *exitOnInitialEventsEndBookmark {
- watchDuration := clock.Since(start)
- klog.V(4).Infof("exiting %v Watch because received the bookmark that marks the end of initial events stream, total %v items received in %v", name, eventCount, watchDuration)
- return nil
- }
- }
- }
- watchDuration := clock.Since(start)
- if watchDuration < 1*time.Second && eventCount == 0 {
- return fmt.Errorf("very short watch: %s: Unexpected watch close - watch lasted less than a second and no items received", name)
- }
- klog.V(4).Infof("%s: Watch close - %v total %v items received", name, expectedTypeName, eventCount)
- return nil
- }
- // LastSyncResourceVersion is the resource version observed when last sync with the underlying store
- // The value returned is not synchronized with access to the underlying store and is not thread-safe
- func (r *Reflector) LastSyncResourceVersion() string {
- r.lastSyncResourceVersionMutex.RLock()
- defer r.lastSyncResourceVersionMutex.RUnlock()
- return r.lastSyncResourceVersion
- }
- func (r *Reflector) setLastSyncResourceVersion(v string) {
- r.lastSyncResourceVersionMutex.Lock()
- defer r.lastSyncResourceVersionMutex.Unlock()
- r.lastSyncResourceVersion = v
- }
- // relistResourceVersion determines the resource version the reflector should list or relist from.
- // Returns either the lastSyncResourceVersion so that this reflector will relist with a resource
- // versions no older than has already been observed in relist results or watch events, or, if the last relist resulted
- // in an HTTP 410 (Gone) status code, returns "" so that the relist will use the latest resource version available in
- // etcd via a quorum read.
- func (r *Reflector) relistResourceVersion() string {
- r.lastSyncResourceVersionMutex.RLock()
- defer r.lastSyncResourceVersionMutex.RUnlock()
- if r.isLastSyncResourceVersionUnavailable {
- // Since this reflector makes paginated list requests, and all paginated list requests skip the watch cache
- // if the lastSyncResourceVersion is unavailable, we set ResourceVersion="" and list again to re-establish reflector
- // to the latest available ResourceVersion, using a consistent read from etcd.
- return ""
- }
- if r.lastSyncResourceVersion == "" {
- // For performance reasons, initial list performed by reflector uses "0" as resource version to allow it to
- // be served from the watch cache if it is enabled.
- return "0"
- }
- return r.lastSyncResourceVersion
- }
- // rewatchResourceVersion determines the resource version the reflector should start streaming from.
- func (r *Reflector) rewatchResourceVersion() string {
- r.lastSyncResourceVersionMutex.RLock()
- defer r.lastSyncResourceVersionMutex.RUnlock()
- if r.isLastSyncResourceVersionUnavailable {
- // initial stream should return data at the most recent resource version.
- // the returned data must be consistent i.e. as if served from etcd via a quorum read
- return ""
- }
- return r.lastSyncResourceVersion
- }
- // setIsLastSyncResourceVersionUnavailable sets if the last list or watch request with lastSyncResourceVersion returned
- // "expired" or "too large resource version" error.
- func (r *Reflector) setIsLastSyncResourceVersionUnavailable(isUnavailable bool) {
- r.lastSyncResourceVersionMutex.Lock()
- defer r.lastSyncResourceVersionMutex.Unlock()
- r.isLastSyncResourceVersionUnavailable = isUnavailable
- }
- func isExpiredError(err error) bool {
- // In Kubernetes 1.17 and earlier, the api server returns both apierrors.StatusReasonExpired and
- // apierrors.StatusReasonGone for HTTP 410 (Gone) status code responses. In 1.18 the kube server is more consistent
- // and always returns apierrors.StatusReasonExpired. For backward compatibility we can only remove the apierrors.IsGone
- // check when we fully drop support for Kubernetes 1.17 servers from reflectors.
- return apierrors.IsResourceExpired(err) || apierrors.IsGone(err)
- }
- func isTooLargeResourceVersionError(err error) bool {
- if apierrors.HasStatusCause(err, metav1.CauseTypeResourceVersionTooLarge) {
- return true
- }
- // In Kubernetes 1.17.0-1.18.5, the api server doesn't set the error status cause to
- // metav1.CauseTypeResourceVersionTooLarge to indicate that the requested minimum resource
- // version is larger than the largest currently available resource version. To ensure backward
- // compatibility with these server versions we also need to detect the error based on the content
- // of the error message field.
- if !apierrors.IsTimeout(err) {
- return false
- }
- apierr, ok := err.(apierrors.APIStatus)
- if !ok || apierr == nil || apierr.Status().Details == nil {
- return false
- }
- for _, cause := range apierr.Status().Details.Causes {
- // Matches the message returned by api server 1.17.0-1.18.5 for this error condition
- if cause.Message == "Too large resource version" {
- return true
- }
- }
- // Matches the message returned by api server before 1.17.0
- if strings.Contains(apierr.Status().Message, "Too large resource version") {
- return true
- }
- return false
- }
- // isWatchErrorRetriable determines if it is safe to retry
- // a watch error retrieved from the server.
- func isWatchErrorRetriable(err error) bool {
- // If this is "connection refused" error, it means that most likely apiserver is not responsive.
- // It doesn't make sense to re-list all objects because most likely we will be able to restart
- // watch where we ended.
- // If that's the case begin exponentially backing off and resend watch request.
- // Do the same for "429" errors.
- if utilnet.IsConnectionRefused(err) || apierrors.IsTooManyRequests(err) {
- return true
- }
- return false
- }
|