Skip to content

Cache older index entries #1130

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 4 commits into from
Jan 7, 2019
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions pkg/chunk/chunk_store.go
Original file line number Diff line number Diff line change
Expand Up @@ -61,6 +61,8 @@ type StoreConfig struct {
CardinalityCacheSize int
CardinalityCacheValidity time.Duration
CardinalityLimit int

CacheLookupsOlderThan time.Duration
}

// RegisterFlags adds the flags required to config this to the given FlagSet
Expand All @@ -73,6 +75,7 @@ func (cfg *StoreConfig) RegisterFlags(f *flag.FlagSet) {
f.IntVar(&cfg.CardinalityCacheSize, "store.cardinality-cache-size", 0, "Size of in-memory cardinality cache, 0 to disable.")
f.DurationVar(&cfg.CardinalityCacheValidity, "store.cardinality-cache-validity", 1*time.Hour, "Period for which entries in the cardinality cache are valid.")
f.IntVar(&cfg.CardinalityLimit, "store.cardinality-limit", 1e5, "Cardinality limit for index queries.")
f.DurationVar(&cfg.CacheLookupsOlderThan, "store.cache-lookups-older-than", 0, "Cache index entries older than this period. 0 to disable.")
}

// store implements Store
Expand Down
3 changes: 3 additions & 0 deletions pkg/chunk/schema.go
Original file line number Diff line number Diff line change
Expand Up @@ -58,6 +58,9 @@ type IndexQuery struct {

// Filters for querying
ValueEqual []byte

// If the result of this lookup is immutable or not (for caching).
Immutable bool
}

// IndexEntry describes an entry in the chunk index
Expand Down
113 changes: 113 additions & 0 deletions pkg/chunk/schema_caching.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,113 @@
package chunk

import (
"time"

"github.com/prometheus/common/model"
"github.com/weaveworks/common/mtime"
)

// schemaCaching wraps a Schema and splits every index lookup at a cut-off
// (mtime.Now() - cacheOlderThan). Queries that cover only data older than
// the cut-off are flagged as Immutable so the caching index client can keep
// their results without an expiry.
type schemaCaching struct {
	Schema

	// cacheOlderThan is the age beyond which index lookups are treated as
	// immutable (cacheable forever).
	cacheOlderThan time.Duration
}

// GetReadQueriesForMetric splits the requested range at the cacheability
// cut-off, asks the wrapped Schema for each half, and merges the results so
// that queries over old data are marked Immutable.
func (s *schemaCaching) GetReadQueriesForMetric(from, through model.Time, userID string, metricName model.LabelValue) ([]IndexQuery, error) {
	cutoff := model.TimeFromUnix(mtime.Now().Add(-s.cacheOlderThan).Unix())
	cacheFrom, cacheThrough, activeFrom, activeThrough := splitTimesByCacheability(from, through, cutoff)

	cacheable, err := s.Schema.GetReadQueriesForMetric(cacheFrom, cacheThrough, userID, metricName)
	if err != nil {
		return nil, err
	}

	active, err := s.Schema.GetReadQueriesForMetric(activeFrom, activeThrough, userID, metricName)
	if err != nil {
		return nil, err
	}

	return mergeCacheableAndActiveQueries(cacheable, active), nil
}

// GetReadQueriesForMetricLabel splits the requested range at the
// cacheability cut-off, delegates both halves to the wrapped Schema, and
// merges the results, marking queries over old data as Immutable.
func (s *schemaCaching) GetReadQueriesForMetricLabel(from, through model.Time, userID string, metricName model.LabelValue, labelName model.LabelName) ([]IndexQuery, error) {
	cutoff := model.TimeFromUnix(mtime.Now().Add(-s.cacheOlderThan).Unix())
	cacheFrom, cacheThrough, activeFrom, activeThrough := splitTimesByCacheability(from, through, cutoff)

	cacheable, err := s.Schema.GetReadQueriesForMetricLabel(cacheFrom, cacheThrough, userID, metricName, labelName)
	if err != nil {
		return nil, err
	}

	active, err := s.Schema.GetReadQueriesForMetricLabel(activeFrom, activeThrough, userID, metricName, labelName)
	if err != nil {
		return nil, err
	}

	return mergeCacheableAndActiveQueries(cacheable, active), nil
}

// GetReadQueriesForMetricLabelValue splits the requested range at the
// cacheability cut-off, delegates both halves to the wrapped Schema, and
// merges the results, marking queries over old data as Immutable.
func (s *schemaCaching) GetReadQueriesForMetricLabelValue(from, through model.Time, userID string, metricName model.LabelValue, labelName model.LabelName, labelValue model.LabelValue) ([]IndexQuery, error) {
	cutoff := model.TimeFromUnix(mtime.Now().Add(-s.cacheOlderThan).Unix())
	cacheFrom, cacheThrough, activeFrom, activeThrough := splitTimesByCacheability(from, through, cutoff)

	cacheable, err := s.Schema.GetReadQueriesForMetricLabelValue(cacheFrom, cacheThrough, userID, metricName, labelName, labelValue)
	if err != nil {
		return nil, err
	}

	active, err := s.Schema.GetReadQueriesForMetricLabelValue(activeFrom, activeThrough, userID, metricName, labelName, labelValue)
	if err != nil {
		return nil, err
	}

	return mergeCacheableAndActiveQueries(cacheable, active), nil
}

// GetChunksForSeries finds chunks for previously-resolved series IDs. Like
// the other read paths, the range is split at the cacheability cut-off and
// queries over old data come back marked Immutable.
func (s *schemaCaching) GetChunksForSeries(from, through model.Time, userID string, seriesID []byte) ([]IndexQuery, error) {
	cutoff := model.TimeFromUnix(mtime.Now().Add(-s.cacheOlderThan).Unix())
	cacheFrom, cacheThrough, activeFrom, activeThrough := splitTimesByCacheability(from, through, cutoff)

	cacheable, err := s.Schema.GetChunksForSeries(cacheFrom, cacheThrough, userID, seriesID)
	if err != nil {
		return nil, err
	}

	active, err := s.Schema.GetChunksForSeries(activeFrom, activeThrough, userID, seriesID)
	if err != nil {
		return nil, err
	}

	return mergeCacheableAndActiveQueries(cacheable, active), nil
}

func splitTimesByCacheability(from, through model.Time, cacheBefore model.Time) (model.Time, model.Time, model.Time, model.Time) {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Is this really valuable in the presence of the caching front-end which will shard by day?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Not really, if using the frontend, but the frontend is an optional component, I guess?

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Plus I'd say yes it is - the caching frontend only matches exact querier, this will match individual labels, which is useful across multiple different queries.

if from.After(cacheBefore) {
return 0, 0, from, through
}

if through.Before(cacheBefore) {
return from, through, 0, 0
}

return from, cacheBefore, cacheBefore, through
}

// mergeCacheableAndActiveQueries combines both query sets into one slice:
// every cacheable query is marked Immutable unless the same query also
// appears in the active set, in which case only the mutable (active) copy is
// kept. Cacheable queries come first, then all active queries, preserving
// the original ordering within each set.
func mergeCacheableAndActiveQueries(cacheableQueries []IndexQuery, activeQueries []IndexQuery) []IndexQuery {
	finalQueries := make([]IndexQuery, 0, len(cacheableQueries)+len(activeQueries))

	// When deduping, the bucket values only influence TableName and HashValue
	// and just checking those is enough. Index the active queries once so the
	// merge is O(n+m) instead of the quadratic nested-loop scan.
	type tableHash struct {
		table, hash string
	}
	active := make(map[tableHash]struct{}, len(activeQueries))
	for _, aq := range activeQueries {
		active[tableHash{aq.TableName, aq.HashValue}] = struct{}{}
	}

	for _, cq := range cacheableQueries {
		if _, ok := active[tableHash{cq.TableName, cq.HashValue}]; ok {
			// Also queried as active; drop the cacheable duplicate.
			continue
		}
		cq.Immutable = true
		finalQueries = append(finalQueries, cq)
	}

	return append(finalQueries, activeQueries...)
}
75 changes: 75 additions & 0 deletions pkg/chunk/schema_caching_test.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,75 @@
package chunk

import (
"testing"
"time"

"github.com/prometheus/common/model"
"github.com/stretchr/testify/require"
"github.com/weaveworks/common/mtime"
)

// TestCachingSchema verifies that schemaCaching marks index queries covering
// data older than cacheOlderThan as Immutable while leaving queries over
// recent data mutable.
func TestCachingSchema(t *testing.T) {
	const (
		userID         = "userid"
		periodicPrefix = "periodicPrefix"
	)

	dailyBuckets := makeSchema("v3")
	schema := &schemaCaching{
		Schema:         dailyBuckets,
		cacheOlderThan: 24 * time.Hour,
	}

	baseTime := time.Unix(0, 0)
	baseTime = baseTime.Add(30*24*time.Hour - 1)

	mtime.NowForce(baseTime)
	// Restore the real clock so the forced time does not leak into other tests.
	defer mtime.NowReset()

	for _, tc := range []struct {
		from, through time.Time

		// Index of the last query expected to be Immutable; -1 when none are.
		cacheableIdx int
	}{
		{
			// Completely cacheable.
			baseTime.Add(-36 * time.Hour),
			baseTime.Add(-25 * time.Hour),
			0,
		},
		{
			// Completely active.
			baseTime.Add(-23 * time.Hour),
			baseTime.Add(-2 * time.Hour),
			-1,
		},
		{
			// Mix of both but the cacheable entry is also active.
			baseTime.Add(-36 * time.Hour),
			baseTime.Add(-2 * time.Hour),
			-1,
		},
		{
			// Mix of both.
			baseTime.Add(-50 * time.Hour),
			baseTime.Add(-2 * time.Hour),
			0,
		},
	} {
		have, err := schema.GetReadQueriesForMetric(
			model.TimeFromUnix(tc.from.Unix()), model.TimeFromUnix(tc.through.Unix()),
			userID, model.LabelValue("foo"),
		)
		require.NoError(t, err)

		for i := range have {
			if i <= tc.cacheableIdx {
				require.True(t, have[i].Immutable)
			} else {
				require.False(t, have[i].Immutable)
			}
		}
	}
}
7 changes: 7 additions & 0 deletions pkg/chunk/series_store.go
Original file line number Diff line number Diff line change
Expand Up @@ -73,6 +73,13 @@ func newSeriesStore(cfg StoreConfig, schema Schema, index IndexClient, chunks Ob
return nil, err
}

if cfg.CacheLookupsOlderThan != 0 {
schema = &schemaCaching{
Schema: schema,
cacheOlderThan: cfg.CacheLookupsOlderThan,
}
}

return &seriesStore{
store: store{
cfg: cfg,
Expand Down
12 changes: 10 additions & 2 deletions pkg/chunk/storage/caching_index_client.go
Original file line number Diff line number Diff line change
Expand Up @@ -100,10 +100,18 @@ func (s *cachingIndexClient) QueryPages(ctx context.Context, queries []chunk.Ind
TableName: queries[0].TableName,
HashValue: queries[0].HashValue,
})
results[key] = ReadBatch{

rb := ReadBatch{
Key: key,
Expiry: expiryTime.UnixNano(),
}

// If the query is cacheable forever, nil the expiry.
if queries[0].Immutable {
rb.Expiry = 0
}

results[key] = rb
}

err := s.IndexClient.QueryPages(ctx, cacheableMissed, func(cacheableQuery chunk.IndexQuery, r chunk.ReadBatch) bool {
Expand Down Expand Up @@ -232,7 +240,7 @@ func (s *cachingIndexClient) cacheFetch(ctx context.Context, keys []string) (bat

// Make sure the hash(key) is not a collision in the cache by looking at the
// key in the value.
if key != readBatch.Key || time.Now().After(time.Unix(0, readBatch.Expiry)) {
if key != readBatch.Key || (readBatch.Expiry != 0 && time.Now().After(time.Unix(0, readBatch.Expiry))) {
cacheCorruptErrs.Inc()
continue
}
Expand Down
74 changes: 72 additions & 2 deletions pkg/chunk/storage/caching_index_client_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -54,7 +54,7 @@ func TestCachingStorageClientBasic(t *testing.T) {
assert.EqualValues(t, 1, store.queries)
}

func TestCachingStorageClient(t *testing.T) {
func TestTempCachingStorageClient(t *testing.T) {
store := &mockStore{
results: ReadBatch{
Entries: []Entry{{
Expand All @@ -64,7 +64,7 @@ func TestCachingStorageClient(t *testing.T) {
},
}
cache := cache.NewFifoCache("test", cache.FifoCacheConfig{Size: 10, Validity: 10 * time.Second})
client := newCachingIndexClient(store, cache, 1*time.Second)
client := newCachingIndexClient(store, cache, 100*time.Millisecond)
queries := []chunk.IndexQuery{
{TableName: "table", HashValue: "foo"},
{TableName: "table", HashValue: "bar"},
Expand Down Expand Up @@ -94,6 +94,76 @@ func TestCachingStorageClient(t *testing.T) {
require.NoError(t, err)
assert.EqualValues(t, len(queries), store.queries)
assert.EqualValues(t, len(queries), results)

// If we do the query after validity, it should see the queries.
time.Sleep(100 * time.Millisecond)
results = 0
err = client.QueryPages(context.Background(), queries, func(query chunk.IndexQuery, batch chunk.ReadBatch) bool {
iter := batch.Iterator()
for iter.Next() {
results++
}
return true
})
require.NoError(t, err)
assert.EqualValues(t, 2*len(queries), store.queries)
assert.EqualValues(t, len(queries), results)
}

// TestPermCachingStorageClient checks that results for Immutable queries are
// cached without expiry: the underlying store must be hit exactly once no
// matter how often, or how late, the same queries are re-issued.
func TestPermCachingStorageClient(t *testing.T) {
	store := &mockStore{
		results: ReadBatch{
			Entries: []Entry{{
				Column: []byte("foo"),
				Value:  []byte("bar"),
			}},
		},
	}
	cache := cache.NewFifoCache("test", cache.FifoCacheConfig{Size: 10, Validity: 10 * time.Second})
	client := newCachingIndexClient(store, cache, 100*time.Millisecond)
	queries := []chunk.IndexQuery{
		{TableName: "table", HashValue: "foo", Immutable: true},
		{TableName: "table", HashValue: "bar", Immutable: true},
		{TableName: "table", HashValue: "baz", Immutable: true},
	}

	// runQueries issues all queries through the client and returns the total
	// number of result entries seen by the callback.
	runQueries := func() int {
		results := 0
		err := client.QueryPages(context.Background(), queries, func(query chunk.IndexQuery, batch chunk.ReadBatch) bool {
			iter := batch.Iterator()
			for iter.Next() {
				results++
			}
			return true
		})
		require.NoError(t, err)
		return results
	}

	// First round populates the cache from the underlying store.
	assert.EqualValues(t, len(queries), runQueries())
	assert.EqualValues(t, len(queries), store.queries)

	// Second round is served from cache; the store sees no new queries.
	assert.EqualValues(t, len(queries), runQueries())
	assert.EqualValues(t, len(queries), store.queries)

	// Even after the normal validity period, immutable entries stay cached.
	time.Sleep(200 * time.Millisecond)
	assert.EqualValues(t, len(queries), runQueries())
	assert.EqualValues(t, len(queries), store.queries)
}

func TestCachingStorageClientEmptyResponse(t *testing.T) {
Expand Down
5 changes: 2 additions & 3 deletions pkg/chunk/storage/factory.go
Original file line number Diff line number Diff line change
Expand Up @@ -46,10 +46,10 @@ func (cfg *Config) RegisterFlags(f *flag.FlagSet) {

// Deprecated flags!!
f.IntVar(&cfg.IndexCacheSize, "store.index-cache-size", 0, "Deprecated: Use -store.index-cache-read.*; Size of in-memory index cache, 0 to disable.")
f.DurationVar(&cfg.IndexCacheValidity, "store.index-cache-validity", 5*time.Minute, "Deprecated: Use -store.index-cache-read.*; Period for which entries in the index cache are valid. Should be no higher than -ingester.max-chunk-idle.")
cfg.memcacheClient.RegisterFlagsWithPrefix("index.", "Deprecated: Use -store.index-cache-read.*;", f)

cfg.indexQueriesCacheConfig.RegisterFlagsWithPrefix("store.index-cache-read.", "Cache config for index entry reading. ", f)
f.DurationVar(&cfg.IndexCacheValidity, "store.index-cache-validity", 5*time.Minute, "Cache validity for active index entries. Should be no higher than -ingester.max-chunk-idle.")
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Looks like this is no longer used?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is how long we want to cache the active entries.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I can't see where it is used either

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

It is being used here: https://github.com/cortexproject/cortex/pull/1130/files#diff-d479a87a51735dca31797a0bc4af42caL95 to set the valid duration for caching mutable entries.

}

// NewStore makes the storage clients based on the configuration.
Expand All @@ -59,7 +59,7 @@ func NewStore(cfg Config, storeCfg chunk.StoreConfig, schemaCfg chunk.SchemaConf
// Building up from deprecated flags.
var caches []cache.Cache
if cfg.IndexCacheSize > 0 {
fifocache := cache.Instrument("fifo-index", cache.NewFifoCache("index", cache.FifoCacheConfig{Size: cfg.IndexCacheSize, Validity: cfg.IndexCacheValidity}))
fifocache := cache.Instrument("fifo-index", cache.NewFifoCache("index", cache.FifoCacheConfig{Size: cfg.IndexCacheSize}))
caches = append(caches, fifocache)
}
if cfg.memcacheClient.Host != "" {
Expand All @@ -76,7 +76,6 @@ func NewStore(cfg Config, storeCfg chunk.StoreConfig, schemaCfg chunk.SchemaConf
var tieredCache cache.Cache
if len(caches) > 0 {
tieredCache = cache.NewTiered(caches)
cfg.indexQueriesCacheConfig.DefaultValidity = cfg.IndexCacheValidity
} else {
tieredCache, err = cache.New(cfg.indexQueriesCacheConfig)
if err != nil {
Expand Down