cache - watch cache - 《学习笔记》

const (
    // 主要是若给定版本的obj不在cache，需要去etcd fetch数据
    // 此参数代表了fetch的超时时间
    blockTimeout = 3 * time.Second
    // 客户端收到too high resource version异常需要先block的时长，然后再重拾
    resourceVersionTooHighRetrySeconds = 1
)
// 为了避免多次计算obj的key/label/field，需要缓存这些值
type storeElement struct {
    Key    string
    Object runtime.Object
    Labels labels.Set
    Fields fields.Set
}
func storeElementKey(obj interface{}) (string, error) {
    elem, ok := obj.(*storeElement)
    if !ok {
        return "", fmt.Errorf("not a storeElement: %v", obj)
    }
    return elem.Key, nil
}
func storeElementObject(obj interface{}) (runtime.Object, error) {
    elem, ok := obj.(*storeElement)
    if !ok {
        return nil, fmt.Errorf("not a storeElement: %v", obj)
    }
    return elem.Object, nil
}
func storeElementIndexFunc(objIndexFunc cache.IndexFunc) cache.IndexFunc {
    return func(obj interface{}) (strings []string, e error) {
        seo, err := storeElementObject(obj)
        if err != nil {
            return nil, err
        }
        return objIndexFunc(seo)
    }
}
func storeElementIndexers(indexers *cache.Indexers) cache.Indexers {
    if indexers == nil {
        return cache.Indexers{}
    }
    ret := cache.Indexers{}
    for indexName, indexFunc := range *indexers {
        ret[indexName] = storeElementIndexFunc(indexFunc)
    }
    return ret
}
// watchCache实际上是一个滑动窗口
// 维护固定数量的obj
type watchCache struct {
    sync.RWMutex
    // 等待刷新足够的版本数据到cache
    cond *sync.Cond
    // 滑动窗口的容量
    capacity     int
    keyFunc      func(runtime.Object) (string, error)
    getAttrsFunc func(runtime.Object) (labels.Set, fields.Set, error)
    // cache is used a cyclic buffer - its first element (with the smallest
    // resourceVersion) is defined by startIndex, its last element is defined
    // by endIndex (if cache is full it will be startIndex + capacity).
    // Both startIndex and endIndex can be greater than buffer capacity -
    // you should always apply modulo capacity to get an index in cache array.
    cache      []*watchCacheEvent
    startIndex int
    endIndex   int
    // store will effectively support LIST operation from the "end of cache
    // history" i.e. from the moment just after the newest cached watched event.
    // It is necessary to effectively allow clients to start watching at now.
    // NOTE: We assume that <store> is thread-safe.
    store cache.Indexer
    // ResourceVersion up to which the watchCache is propagated.
    resourceVersion uint64
    // ResourceVersion of the last list result (populated via Replace() method).
    listResourceVersion uint64
    // This handler is run at the end of every successful Replace() method.
    onReplace func()
    // 事件处理器
    eventHandler func(*watchCacheEvent)
    clock        clock.Clock
    // 获取obj的resourceversion信息
    versioner storage.Versioner
}
type watchCacheEvent struct {
    Key             string
    ResourceVersion uint64
    Type            watch.EventType
    Object          runtime.Object
    ObjLabels       labels.Set
    ObjFields       fields.Set
    PrevObject      runtime.Object
    PrevObjLabels   labels.Set
    PrevObjFields   fields.Set
}
func newWatchCache(
    capacity int,
    keyFunc func(runtime.Object) (string, error),
    eventHandler func(*watchCacheEvent),
    getAttrsFunc func(runtime.Object) (labels.Set, fields.Set, error),
    versioner storage.Versioner,
    indexers *cache.Indexers) *watchCache {
    wc := &watchCache{
        capacity:            capacity,
        keyFunc:             keyFunc,
        getAttrsFunc:        getAttrsFunc,
        cache:               make([]*watchCacheEvent, capacity),
        startIndex:          0,
        endIndex:            0,
        store:               cache.NewIndexer(storeElementKey, storeElementIndexers(indexers)),
        resourceVersion:     0,
        listResourceVersion: 0,
        eventHandler:        eventHandler,
        clock:               clock.RealClock{},
        versioner:           versioner,
    }
    wc.cond = sync.NewCond(wc.RLocker())
    return wc
}
func (w *watchCache) Add(obj interface{}) error {
    object, resourceVersion, err := w.objectToVersionedRuntimeObject(obj)
    if err != nil {
        return err
    }
    event := watch.Event{Type: watch.Added, Object: object}
    f := func(elem *storeElement) error { return w.store.Add(elem) }
    return w.processEvent(event, resourceVersion, f)
}
func (w *watchCache) Update(obj interface{}) error {
    object, resourceVersion, err := w.objectToVersionedRuntimeObject(obj)
    if err != nil {
        return err
    }
    event := watch.Event{Type: watch.Modified, Object: object}
    f := func(elem *storeElement) error { return w.store.Update(elem) }
    return w.processEvent(event, resourceVersion, f)
}
func (w *watchCache) Delete(obj interface{}) error {
    object, resourceVersion, err := w.objectToVersionedRuntimeObject(obj)
    if err != nil {
        return err
    }
    event := watch.Event{Type: watch.Deleted, Object: object}
    f := func(elem *storeElement) error { return w.store.Delete(elem) }
    return w.processEvent(event, resourceVersion, f)
}
func (w *watchCache) List() []interface{} {
    return w.store.List()
}
func (w *watchCache) ListKeys() []string {
    return w.store.ListKeys()
}
func (w *watchCache) WaitUntilFreshAndList(resourceVersion uint64, matchValues []storage.MatchValue, trace *utiltrace.Trace) ([]interface{}, uint64, error) {
    err := w.waitUntilFreshAndBlock(resourceVersion, trace)
    defer w.RUnlock()
    if err != nil {
        return nil, 0, err
    }
    // This isn't the place where we do "final filtering" - only some "prefiltering" is happening here. So the only
    // requirement here is to NOT miss anything that should be returned. We can return as many non-matching items as we
    // want - they will be filtered out later. The fact that we return less things is only further performance improvement.
    // TODO: if multiple indexes match, return the one with the fewest items, so as to do as much filtering as possible.
    for _, matchValue := range matchValues {
        if result, err := w.store.ByIndex(matchValue.IndexName, matchValue.Value); err == nil {
            return result, w.resourceVersion, nil
        }
    }
    return w.store.List(), w.resourceVersion, nil
}
func (w *watchCache) WaitUntilFreshAndGet(resourceVersion uint64, key string, trace *utiltrace.Trace) (interface{}, bool, uint64, error) {
    err := w.waitUntilFreshAndBlock(resourceVersion, trace)
    defer w.RUnlock()
    if err != nil {
        return nil, false, 0, err
    }
    value, exists, err := w.store.GetByKey(key)
    return value, exists, w.resourceVersion, err
}
func (w *watchCache) Get(obj interface{}) (interface{}, bool, error) {
    object, ok := obj.(runtime.Object)
    if !ok {
        return nil, false, fmt.Errorf("obj does not implement runtime.Object interface: %v", obj)
    }
    key, err := w.keyFunc(object)
    if err != nil {
        return nil, false, fmt.Errorf("couldn't compute key: %v", err)
    }
    return w.store.Get(&storeElement{Key: key, Object: object})
}
func (w *watchCache) GetByKey(key string) (interface{}, bool, error) {
    return w.store.GetByKey(key)
}
func (w *watchCache) Replace(objs []interface{}, resourceVersion string) error {
    version, err := w.versioner.ParseResourceVersion(resourceVersion)
    if err != nil {
        return err
    }
    toReplace := make([]interface{}, 0, len(objs))
    for _, obj := range objs {
        object, ok := obj.(runtime.Object)
        if !ok {
            return fmt.Errorf("didn't get runtime.Object for replace: %#v", obj)
        }
        key, err := w.keyFunc(object)
        if err != nil {
            return fmt.Errorf("couldn't compute key: %v", err)
        }
        objLabels, objFields, err := w.getAttrsFunc(object)
        if err != nil {
            return err
        }
        toReplace = append(toReplace, &storeElement{
            Key:    key,
            Object: object,
            Labels: objLabels,
            Fields: objFields,
        })
    }
    w.Lock()
    defer w.Unlock()
    w.startIndex = 0
    w.endIndex = 0
    if err := w.store.Replace(toReplace, resourceVersion); err != nil {
        return err
    }
    w.listResourceVersion = version
    w.resourceVersion = version
    if w.onReplace != nil {
        w.onReplace()
    }
    w.cond.Broadcast()
    return nil
}
func (w *watchCache) SetOnReplace(onReplace func()) {
    w.Lock()
    defer w.Unlock()
    w.onReplace = onReplace
}
func (w *watchCache) GetAllEventsSinceThreadUnsafe(resourceVersion uint64) ([]*watchCacheEvent, error) {
    size := w.endIndex - w.startIndex
    var oldest uint64
    switch {
    case size >= w.capacity:
        // Once the watch event buffer is full, the oldest watch event we can deliver
        // is the first one in the buffer.
        oldest = w.cache[w.startIndex%w.capacity].ResourceVersion
    case w.listResourceVersion > 0:
        // If the watch event buffer isn't full, the oldest watch event we can deliver
        // is one greater than the resource version of the last full list.
        oldest = w.listResourceVersion + 1
    case size > 0:
        // If we've never completed a list, use the resourceVersion of the oldest event
        // in the buffer.
        // This should only happen in unit tests that populate the buffer without
        // performing list/replace operations.
        oldest = w.cache[w.startIndex%w.capacity].ResourceVersion
    default:
        return nil, fmt.Errorf("watch cache isn't correctly initialized")
    }
    if resourceVersion == 0 {
        // resourceVersion = 0 means that we don't require any specific starting point
        // and we would like to start watching from ~now.
        // However, to keep backward compatibility, we additionally need to return the
        // current state and only then start watching from that point.
        //
        // TODO: In v2 api, we should stop returning the current state - #13969.
        allItems := w.store.List()
        result := make([]*watchCacheEvent, len(allItems))
        for i, item := range allItems {
            elem, ok := item.(*storeElement)
            if !ok {
                return nil, fmt.Errorf("not a storeElement: %v", elem)
            }
            objLabels, objFields, err := w.getAttrsFunc(elem.Object)
            if err != nil {
                return nil, err
            }
            result[i] = &watchCacheEvent{
                Type:            watch.Added,
                Object:          elem.Object,
                ObjLabels:       objLabels,
                ObjFields:       objFields,
                Key:             elem.Key,
                ResourceVersion: w.resourceVersion,
            }
        }
        return result, nil
    }
    if resourceVersion < oldest-1 {
        return nil, errors.NewResourceExpired(fmt.Sprintf("too old resource version: %d (%d)", resourceVersion, oldest-1))
    }
    // Binary search the smallest index at which resourceVersion is greater than the given one.
    f := func(i int) bool {
        return w.cache[(w.startIndex+i)%w.capacity].ResourceVersion > resourceVersion
    }
    first := sort.Search(size, f)
    result := make([]*watchCacheEvent, size-first)
    for i := 0; i < size-first; i++ {
        result[i] = w.cache[(w.startIndex+first+i)%w.capacity]
    }
    return result, nil
}
func (w *watchCache) GetAllEventsSince(resourceVersion uint64) ([]*watchCacheEvent, error) {
    w.RLock()
    defer w.RUnlock()
    return w.GetAllEventsSinceThreadUnsafe(resourceVersion)
}
func (w *watchCache) Resync() error {
    return nil
}
func (w *watchCache) processEvent(event watch.Event, resourceVersion uint64, updateFunc func(*storeElement) error) error {
    key, err := w.keyFunc(event.Object)
    if err != nil {
        return fmt.Errorf("couldn't compute key: %v", err)
    }
    elem := &storeElement{Key: key, Object: event.Object}
    elem.Labels, elem.Fields, err = w.getAttrsFunc(event.Object)
    if err != nil {
        return err
    }
    wcEvent := &watchCacheEvent{
        Type:            event.Type,
        Object:          elem.Object,
        ObjLabels:       elem.Labels,
        ObjFields:       elem.Fields,
        Key:             key,
        ResourceVersion: resourceVersion,
    }
    if err := func() error {
        // TODO: We should consider moving this lock below after the watchCacheEvent
        // is created. In such situation, the only problematic scenario is Replace(
        // happening after getting object from store and before acquiring a lock.
        // Maybe introduce another lock for this purpose.
        w.Lock()
        defer w.Unlock()
        previous, exists, err := w.store.Get(elem)
        if err != nil {
            return err
        }
        if exists {
            previousElem := previous.(*storeElement)
            wcEvent.PrevObject = previousElem.Object
            wcEvent.PrevObjLabels = previousElem.Labels
            wcEvent.PrevObjFields = previousElem.Fields
        }
        w.updateCache(wcEvent)
        w.resourceVersion = resourceVersion
        defer w.cond.Broadcast()
        return updateFunc(elem)
    }(); err != nil {
        return err
    }
    // Avoid calling event handler under lock.
    // This is safe as long as there is at most one call to processEvent in flight
    // at any point in time.
    if w.eventHandler != nil {
        w.eventHandler(wcEvent)
    }
    return nil
}
func (w *watchCache) updateCache(event *watchCacheEvent) {
    if w.endIndex == w.startIndex+w.capacity {
        // Cache is full - remove the oldest element.
        w.startIndex++
    }
    w.cache[w.endIndex%w.capacity] = event
    w.endIndex++
}
func (w *watchCache) waitUntilFreshAndBlock(resourceVersion uint64, trace *utiltrace.Trace) error {
    startTime := w.clock.Now()
    go func() {
        // Wake us up when the time limit has expired.  The docs
        // promise that time.After (well, NewTimer, which it calls)
        // will wait *at least* the duration given. Since this go
        // routine starts sometime after we record the start time, and
        // it will wake up the loop below sometime after the broadcast,
        // we don't need to worry about waking it up before the time
        // has expired accidentally.
        <-w.clock.After(blockTimeout)
        w.cond.Broadcast()
    }()
    w.RLock()
    if trace != nil {
        trace.Step("watchCache locked acquired")
    }
    for w.resourceVersion < resourceVersion {
        if w.clock.Since(startTime) >= blockTimeout {
            // Request that the client retry after 'resourceVersionTooHighRetrySeconds' seconds.
            return storage.NewTooLargeResourceVersionError(resourceVersion, w.resourceVersion, resourceVersionTooHighRetrySeconds)
        }
        w.cond.Wait()
    }
    if trace != nil {
        trace.Step("watchCache fresh enough")
    }
    return nil
}
// 解析obj为runtime.Object、version
func (w *watchCache) objectToVersionedRuntimeObject(obj interface{}) (runtime.Object, uint64, error) {
    object, ok := obj.(runtime.Object)
    if !ok {
        return nil, 0, fmt.Errorf("obj does not implement runtime.Object interface: %v", obj)
    }
    resourceVersion, err := w.versioner.ObjectResourceVersion(object)
    if err != nil {
        return nil, 0, err
    }
    return object, resourceVersion, nil
}