From de8f33023e156774f8be237a4dee0f1672c615cd Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Thu, 16 Jan 2020 18:22:39 -0500
Subject: [PATCH 01/25] querier.sum-shards

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 CHANGELOG.md                                  |  11 +
 docs/configuration/arguments.md               |  22 +
 docs/configuration/config-file-reference.md   |   4 +
 go.mod                                        |   1 +
 pkg/chunk/chunk_store.go                      |   3 +
 pkg/chunk/chunk_store_test.go                 |   2 +
 pkg/chunk/chunk_store_utils.go                |  17 +-
 pkg/chunk/schema.go                           |  63 +-
 pkg/chunk/schema_config.go                    |  20 +-
 pkg/chunk/schema_test.go                      |  66 ++
 pkg/chunk/schema_util.go                      |   3 +-
 pkg/chunk/schema_util_test.go                 |   2 +-
 pkg/chunk/series_store.go                     |  31 +-
 pkg/chunk/storage/caching_index_client.go     |   3 +
 pkg/cortex/modules.go                         |  29 +-
 pkg/ingester/ingester.go                      |   2 +
 pkg/querier/astmapper/astmapper.go            | 187 ++++++
 pkg/querier/astmapper/astmapper_test.go       | 102 +++
 pkg/querier/astmapper/embedded.go             | 120 ++++
 pkg/querier/astmapper/parallel.go             |  92 +++
 pkg/querier/astmapper/parallel_test.go        | 119 ++++
 pkg/querier/astmapper/shard_summer.go         | 293 ++++++++
 pkg/querier/astmapper/shard_summer_test.go    | 256 +++++++
 pkg/querier/astmapper/subtree_folder.go       | 102 +++
 pkg/querier/astmapper/subtree_folder_test.go  | 114 ++++
 pkg/querier/chunk_store_queryable.go          |   8 +-
 pkg/querier/chunk_tar_test.go                 |   8 +-
 pkg/querier/chunks_handler.go                 |   3 +-
 pkg/querier/chunkstore/chunkstore.go          |  15 +
 pkg/querier/distributor_queryable.go          |   3 +-
 pkg/querier/ingester_streaming_queryable.go   |   3 +-
 .../lazyquery.go}                             |  47 +-
 pkg/querier/matrix.go                         |   5 +-
 pkg/querier/querier.go                        |  16 +-
 pkg/querier/queryrange/promql_test.go         | 612 +++++++++++++++++
 pkg/querier/queryrange/query_range.go         |  16 +-
 pkg/querier/queryrange/query_range_test.go    |  12 +-
 pkg/querier/queryrange/queryable.go           | 120 ++++
 pkg/querier/queryrange/queryable_test.go      | 260 +++++++
 pkg/querier/queryrange/querysharding.go       | 311 +++++++++
 pkg/querier/queryrange/querysharding_test.go  | 633 ++++++++++++++++++
 pkg/querier/queryrange/results_cache.go       |   2 +-
 pkg/querier/queryrange/results_cache_test.go  |   4 +-
 pkg/querier/queryrange/roundtrip.go           |  38 +-
 pkg/querier/queryrange/roundtrip_test.go      |  37 +-
 pkg/querier/queryrange/series.go              |  55 ++
 pkg/querier/queryrange/series_test.go         |  75 +++
 pkg/querier/queryrange/test_utils.go          | 186 +++++
 pkg/querier/queryrange/test_utils_test.go     | 134 ++++
 pkg/querier/queryrange/value.go               |  73 ++
 pkg/querier/queryrange/value_test.go          | 167 +++++
 pkg/querier/remote_read_test.go               |   4 +-
 pkg/querier/{ => series}/series_set.go        |  61 +-
 pkg/querier/{ => series}/series_set_test.go   |  10 +-
 pkg/querier/unified_querier.go                |   7 +-
 tools/query-audit/auditor.go                  |  92 +++
 tools/query-audit/config.go                   |  67 ++
 tools/query-audit/example-config.yaml         |  37 +
 tools/query-audit/main.go                     |  87 +++
 tools/query-audit/runner.go                   |  32 +
 60 files changed, 4806 insertions(+), 98 deletions(-)
 create mode 100644 pkg/querier/astmapper/astmapper.go
 create mode 100644 pkg/querier/astmapper/astmapper_test.go
 create mode 100644 pkg/querier/astmapper/embedded.go
 create mode 100644 pkg/querier/astmapper/parallel.go
 create mode 100644 pkg/querier/astmapper/parallel_test.go
 create mode 100644 pkg/querier/astmapper/shard_summer.go
 create mode 100644 pkg/querier/astmapper/shard_summer_test.go
 create mode 100644 pkg/querier/astmapper/subtree_folder.go
 create mode 100644 pkg/querier/astmapper/subtree_folder_test.go
 create mode 100644 pkg/querier/chunkstore/chunkstore.go
 rename pkg/querier/{lazy_querier.go => lazyquery/lazyquery.go} (61%)
 create mode 100644 pkg/querier/queryrange/promql_test.go
 create mode 100644 pkg/querier/queryrange/queryable.go
 create mode 100644 pkg/querier/queryrange/queryable_test.go
 create mode 100644 pkg/querier/queryrange/querysharding.go
 create mode 100644 pkg/querier/queryrange/querysharding_test.go
 create mode 100644 pkg/querier/queryrange/series.go
 create mode 100644 pkg/querier/queryrange/series_test.go
 create mode 100644 pkg/querier/queryrange/test_utils.go
 create mode 100644 pkg/querier/queryrange/test_utils_test.go
 create mode 100644 pkg/querier/queryrange/value.go
 create mode 100644 pkg/querier/queryrange/value_test.go
 rename pkg/querier/{ => series}/series_set.go (64%)
 rename pkg/querier/{ => series}/series_set_test.go (88%)
 create mode 100644 tools/query-audit/auditor.go
 create mode 100644 tools/query-audit/config.go
 create mode 100644 tools/query-audit/example-config.yaml
 create mode 100644 tools/query-audit/main.go
 create mode 100644 tools/query-audit/runner.go

diff --git a/CHANGELOG.md b/CHANGELOG.md
index cbe944e7c8a..731cdb0621e 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -44,6 +44,17 @@ Note that the ruler flags need to be changed in this upgrade. You're moving from
 Further, if you're using the configs service, we've upgraded the migration library and this requires some manual intervention. See full instructions below to upgrade your PostgreSQL.
 
 * [CHANGE] The frontend component now does not cache results if it finds a `Cache-Control` header and if one of its values is `no-store`. #1974
+* [FEATURE] Fan out parallelizable queries to backend queriers concurrently.
+  * `-querier.sum-shards` (bool)
+  * Requires a shard-compatible schema (v10+)
+  * This causes the number of traces to increase accordingly.
+  * The query-frontend now requires a schema config to determine how/when to shard queries, either from a file or from flags (i.e. by the `config-yaml` CLI flag). This is the same schema config the queriers consume.
+  * It's also advised to increase downstream concurrency controls:
+    * `querier.max-outstanding-requests-per-tenant`
+    * `querier.max-query-parallelism`
+    * `querier.max-concurrent`
+    * `server.grpc-max-concurrent-streams` (for both query-frontends and queriers)
+* [ENHANCEMENT] metric `cortex_ingester_flush_reasons` gets a new `reason` value: `Spread`, when `-ingester.spread-flushes` option is enabled.
 * [CHANGE] Flags changed with transition to upstream Prometheus rules manager:
   * `-ruler.client-timeout` is now `ruler.configs.client-timeout` in order to match `ruler.configs.url`.
   * `-ruler.group-timeout`has been removed.
diff --git a/docs/configuration/arguments.md b/docs/configuration/arguments.md
index 27633155677..f9f267050e3 100644
--- a/docs/configuration/arguments.md
+++ b/docs/configuration/arguments.md
@@ -68,6 +68,28 @@ The ingester query API was improved over time, but defaults to the old behaviour
 
 ## Query Frontend
 
+- `-querier.sum-shards`
+
+   If set to true, will cause the query frontend to mutate incoming queries when possible by turning `sum` operations into sharded `sum` operations. This requires a shard-compatible schema (v10+). An abridged example:
+   `sum by (foo) (rate(bar{baz="blip"}[1m]))` ->
+   ```
+   sum by (foo) (
+    sum by (foo) (rate(bar{baz="blip",__cortex_shard__="0of16"}[1m])) or
+    sum by (foo) (rate(bar{baz="blip",__cortex_shard__="1of16"}[1m])) or
+    ...
+    sum by (foo) (rate(bar{baz="blip",__cortex_shard__="15of16"}[1m]))
+   )
+   ```
+   When enabled, the query-frontend requires a schema config to determine how/when to shard queries, either from a file or from flags (i.e. by the `config-yaml` CLI flag). This is the same schema config the queriers consume.
+   It's also advised to increase downstream concurrency controls to account for more queries of smaller sizes:
+
+   - `querier.max-outstanding-requests-per-tenant`
+   - `querier.max-query-parallelism`
+   - `querier.max-concurrent`
+   Furthermore, both querier and query-frontend components require the `querier.query-ingesters-within` parameter to know when to start sharding requests (ingester queries are not sharded). It's recommended to align this with `ingester.max-chunk-age`.
+
+   Instrumentation (traces) also scales with the number of sharded queries, so it's suggested to account for increased throughput there as well.
+
 - `-querier.align-querier-with-step`
 
    If set to true, will cause the query frontend to mutate incoming queries and align their start and end parameters to the step parameter of the query.  This improves the cacheability of the query results.
diff --git a/docs/configuration/config-file-reference.md b/docs/configuration/config-file-reference.md
index 3faf24c5b97..7ecfe25a5aa 100644
--- a/docs/configuration/config-file-reference.md
+++ b/docs/configuration/config-file-reference.md
@@ -654,6 +654,10 @@ results_cache:
 # error is returned.
 # CLI flag: -querier.max-retries-per-request
 [max_retries: <int> | default = 5]
+
+# Parse the ast and parallelize sums by shard.
+# CLI flag: -querier.sum-shards
+[sum_shards: <boolean> | default = false]
 ```
 
 ## `ruler_config`
diff --git a/go.mod b/go.mod
index 6df0f778e8c..b25c9de868c 100644
--- a/go.mod
+++ b/go.mod
@@ -72,6 +72,7 @@ require (
 	google.golang.org/api v0.14.0
 	google.golang.org/grpc v1.25.1
 	gopkg.in/yaml.v2 v2.2.5
+	sigs.k8s.io/yaml v1.1.0
 )
 
 replace github.com/Azure/azure-sdk-for-go => github.com/Azure/azure-sdk-for-go v36.2.0+incompatible
diff --git a/pkg/chunk/chunk_store.go b/pkg/chunk/chunk_store.go
index a48b842ce63..a1481d22eee 100644
--- a/pkg/chunk/chunk_store.go
+++ b/pkg/chunk/chunk_store.go
@@ -430,6 +430,9 @@ func (c *store) lookupChunksByMetricName(ctx context.Context, userID string, fro
 }
 
 func (c *store) lookupEntriesByQueries(ctx context.Context, queries []IndexQuery) ([]IndexEntry, error) {
+	log, ctx := spanlogger.New(ctx, "store.lookupEntriesByQueries")
+	defer log.Span.Finish()
+
 	var lock sync.Mutex
 	var entries []IndexEntry
 	err := c.index.QueryPages(ctx, queries, func(query IndexQuery, resp ReadBatch) bool {
diff --git a/pkg/chunk/chunk_store_test.go b/pkg/chunk/chunk_store_test.go
index b6b91de93aa..2e9cd63b58b 100644
--- a/pkg/chunk/chunk_store_test.go
+++ b/pkg/chunk/chunk_store_test.go
@@ -78,6 +78,8 @@ func newTestChunkStoreConfig(t require.TestingT, schemaName string, storeCfg Sto
 		tbmConfig TableManagerConfig
 		schemaCfg = DefaultSchemaConfig("", schemaName, 0)
 	)
+	err := schemaCfg.Validate()
+	require.NoError(t, err)
 	flagext.DefaultValues(&tbmConfig)
 	storage := NewMockStorage()
 	tableManager, err := NewTableManager(tbmConfig, schemaCfg, maxChunkAge, storage, nil)
diff --git a/pkg/chunk/chunk_store_utils.go b/pkg/chunk/chunk_store_utils.go
index 114e2b30106..89fac15dd93 100644
--- a/pkg/chunk/chunk_store_utils.go
+++ b/pkg/chunk/chunk_store_utils.go
@@ -10,6 +10,7 @@ import (
 	"github.com/prometheus/prometheus/promql"
 
 	"github.com/cortexproject/cortex/pkg/chunk/cache"
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/cortexproject/cortex/pkg/util/spanlogger"
 )
@@ -146,13 +147,13 @@ func (c *Fetcher) worker() {
 // FetchChunks fetches a set of chunks from cache and store. Note that the keys passed in must be
 // lexicographically sorted, while the returned chunks are not in the same order as the passed in chunks.
 func (c *Fetcher) FetchChunks(ctx context.Context, chunks []Chunk, keys []string) ([]Chunk, error) {
-	log, ctx := spanlogger.New(ctx, "ChunkStore.fetchChunks")
+	log, ctx := spanlogger.New(ctx, "ChunkStore.FetchChunks")
 	defer log.Span.Finish()
 
 	// Now fetch the actual chunk data from Memcache / S3
 	cacheHits, cacheBufs, _ := c.cache.Fetch(ctx, keys)
 
-	fromCache, missing, err := c.processCacheResponse(chunks, cacheHits, cacheBufs)
+	fromCache, missing, err := c.processCacheResponse(ctx, chunks, cacheHits, cacheBufs)
 	if err != nil {
 		level.Warn(log).Log("msg", "error fetching from cache", "err", err)
 	}
@@ -199,12 +200,14 @@ func (c *Fetcher) writeBackCache(ctx context.Context, chunks []Chunk) error {
 
 // ProcessCacheResponse decodes the chunks coming back from the cache, separating
 // hits and misses.
-func (c *Fetcher) processCacheResponse(chunks []Chunk, keys []string, bufs [][]byte) ([]Chunk, []Chunk, error) {
+func (c *Fetcher) processCacheResponse(ctx context.Context, chunks []Chunk, keys []string, bufs [][]byte) ([]Chunk, []Chunk, error) {
 	var (
 		requests  = make([]decodeRequest, 0, len(keys))
 		responses = make(chan decodeResponse)
 		missing   []Chunk
 	)
+	log, _ := spanlogger.New(ctx, "Fetcher.processCacheResponse")
+	defer log.Span.Finish()
 
 	i, j := 0, 0
 	for i < len(chunks) && j < len(keys) {
@@ -229,6 +232,7 @@ func (c *Fetcher) processCacheResponse(chunks []Chunk, keys []string, bufs [][]b
 	for ; i < len(chunks); i++ {
 		missing = append(missing, chunks[i])
 	}
+	level.Debug(log).Log("chunks", len(chunks), "decodeRequests", len(requests), "missing", len(missing))
 
 	go func() {
 		for _, request := range requests {
@@ -252,3 +256,10 @@ func (c *Fetcher) processCacheResponse(chunks []Chunk, keys []string, bufs [][]b
 	}
 	return found, missing, err
 }
+
+// injectShardLabels appends the shard label to each chunk's metric via a fresh copy. NOTE(review): appended, not sort-inserted — confirm callers don't need sorted labels.
+func injectShardLabels(chunks []Chunk, shard astmapper.ShardAnnotation) {
+	for i, c := range chunks {
+		chunks[i].Metric = append(c.Metric[:len(c.Metric):len(c.Metric)], shard.Label())
+	}
+}
diff --git a/pkg/chunk/schema.go b/pkg/chunk/schema.go
index e52a5eed115..3ef4506a7d1 100644
--- a/pkg/chunk/schema.go
+++ b/pkg/chunk/schema.go
@@ -7,7 +7,11 @@ import (
 	"fmt"
 	"strings"
 
+	"strconv"
+
 	jsoniter "github.com/json-iterator/go"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
 )
@@ -48,6 +52,7 @@ type Schema interface {
 	GetReadQueriesForMetric(from, through model.Time, userID string, metricName string) ([]IndexQuery, error)
 	GetReadQueriesForMetricLabel(from, through model.Time, userID string, metricName string, labelName string) ([]IndexQuery, error)
 	GetReadQueriesForMetricLabelValue(from, through model.Time, userID string, metricName string, labelName string, labelValue string) ([]IndexQuery, error)
+	FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery
 
 	// If the query resulted in series IDs, use this method to find chunks.
 	GetChunksForSeries(from, through model.Time, userID string, seriesID []byte) ([]IndexQuery, error)
@@ -116,7 +121,7 @@ func (s schema) GetCacheKeysAndLabelWriteEntries(from, through model.Time, userI
 		key := strings.Join([]string{
 			bucket.tableName,
 			bucket.hashKey,
-			string(labelsSeriesID(labels)),
+			string(LabelsSeriesID(labels)),
 		},
 			"-",
 		)
@@ -218,6 +223,10 @@ func (s schema) GetLabelNamesForSeries(from, through model.Time, userID string,
 	return result, nil
 }
 
+func (s schema) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery {
+	return s.entries.FilterReadQueries(queries, shard) // filtering is delegated to the schema's entries implementation
+}
+
 type entries interface {
 	GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error)
 	GetLabelWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error)
@@ -228,13 +237,23 @@ type entries interface {
 	GetReadMetricLabelValueQueries(bucket Bucket, metricName string, labelName string, labelValue string) ([]IndexQuery, error)
 	GetChunksForSeries(bucket Bucket, seriesID []byte) ([]IndexQuery, error)
 	GetLabelNamesForSeries(bucket Bucket, seriesID []byte) ([]IndexQuery, error)
+	FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery
+}
+
+// noops can be embedded in an entries implementation to supply a default FilterReadQueries that ignores the shard and returns the queries unfiltered.
+type noops struct{}
+
+func (n noops) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery {
+	return queries
 }
 
 // original entries:
 // - hash key: <userid>:<bucket>:<metric name>
 // - range key: <label name>\0<label value>\0<chunk name>
 
-type originalEntries struct{}
+type originalEntries struct {
+	noops
+}
 
 func (originalEntries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	chunkIDBytes := []byte(chunkID)
@@ -351,7 +370,9 @@ func (base64Entries) GetReadMetricLabelValueQueries(bucket Bucket, metricName st
 //    - range key: \0<base64(label value)>\0<chunk name>\0<version 2>
 // 2) - hash key: <userid>:<hour bucket>:<metric name>
 //    - range key: \0\0<chunk name>\0<version 3>
-type labelNameInHashKeyEntries struct{}
+type labelNameInHashKeyEntries struct {
+	noops
+}
 
 func (labelNameInHashKeyEntries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	chunkIDBytes := []byte(chunkID)
@@ -425,7 +446,9 @@ func (labelNameInHashKeyEntries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]I
 // v5 schema is an extension of v4, with the chunk end time in the
 // range key to improve query latency.  However, it did it wrong
 // so the chunk end times are ignored.
-type v5Entries struct{}
+type v5Entries struct {
+	noops
+}
 
 func (v5Entries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	chunkIDBytes := []byte(chunkID)
@@ -498,7 +521,9 @@ func (v5Entries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]IndexQuery, error
 
 // v6Entries fixes issues with v5 time encoding being wrong (see #337), and
 // moves label value out of range key (see #199).
-type v6Entries struct{}
+type v6Entries struct {
+	noops
+}
 
 func (v6Entries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	chunkIDBytes := []byte(chunkID)
@@ -578,6 +603,7 @@ func (v6Entries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]IndexQuery, error
 
 // v9Entries adds a layer of indirection between labels -> series -> chunks.
 type v9Entries struct {
+	noops
 }
 
 func (v9Entries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
@@ -585,7 +611,7 @@ func (v9Entries) GetWriteEntries(bucket Bucket, metricName string, labels labels
 }
 
 func (v9Entries) GetLabelWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := labelsSeriesID(labels)
+	seriesID := LabelsSeriesID(labels)
 
 	entries := []IndexEntry{
 		// Entry for metricName -> seriesID
@@ -615,7 +641,7 @@ func (v9Entries) GetLabelWriteEntries(bucket Bucket, metricName string, labels l
 }
 
 func (v9Entries) GetChunkWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := labelsSeriesID(labels)
+	seriesID := LabelsSeriesID(labels)
 	encodedThroughBytes := encodeTime(bucket.through)
 
 	entries := []IndexEntry{
@@ -685,7 +711,7 @@ func (v10Entries) GetWriteEntries(bucket Bucket, metricName string, labels label
 }
 
 func (s v10Entries) GetLabelWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := labelsSeriesID(labels)
+	seriesID := LabelsSeriesID(labels)
 
 	// read first 32 bits of the hash and use this to calculate the shard
 	shard := binary.BigEndian.Uint32(seriesID) % s.rowShards
@@ -718,7 +744,7 @@ func (s v10Entries) GetLabelWriteEntries(bucket Bucket, metricName string, label
 }
 
 func (v10Entries) GetChunkWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := labelsSeriesID(labels)
+	seriesID := LabelsSeriesID(labels)
 	encodedThroughBytes := encodeTime(bucket.through)
 
 	entries := []IndexEntry{
@@ -784,13 +810,29 @@ func (v10Entries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]IndexQuery, erro
 	return nil, ErrNotSupported
 }
 
+// FilterReadQueries keeps only the queries whose hash value begins with the requested shard number; a nil shard disables filtering.
+func (v10Entries) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) (matches []IndexQuery) {
+	if shard == nil {
+		return queries
+	}
+
+	for _, query := range queries {
+		// Only the segment before the first ":" is inspected; queries whose prefix is not an integer are dropped.
+		prefix := strings.SplitN(query.HashValue, ":", 2)[0]
+		if n, err := strconv.Atoi(prefix); err == nil && n == shard.Shard {
+			matches = append(matches, query)
+		}
+	}
+	return matches
+}
+
 // v11Entries builds on v10 but adds index entries for each series to store respective labels.
 type v11Entries struct {
 	v10Entries
 }
 
 func (s v11Entries) GetLabelWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := labelsSeriesID(labels)
+	seriesID := LabelsSeriesID(labels)
 
 	// read first 32 bits of the hash and use this to calculate the shard
 	shard := binary.BigEndian.Uint32(seriesID) % s.rowShards
@@ -847,4 +889,5 @@ func (v11Entries) GetLabelNamesForSeries(bucket Bucket, seriesID []byte) ([]Inde
 			HashValue: string(seriesID),
 		},
 	}, nil
+
 }
diff --git a/pkg/chunk/schema_config.go b/pkg/chunk/schema_config.go
index 06312f827bf..b03de6f6c6e 100644
--- a/pkg/chunk/schema_config.go
+++ b/pkg/chunk/schema_config.go
@@ -197,10 +197,18 @@ func (cfg *SchemaConfig) Validate() error {
 			return err
 		}
 	}
-
 	return nil
 }
 
+// defaultRowShards returns the row shard count applied when none is configured: 0 for schemas v1-v6 and v9, 16 for any other schema.
+func defaultRowShards(schema string) uint32 {
+	switch schema {
+	case "v1", "v2", "v3", "v4", "v5", "v6", "v9":
+		return 0
+	}
+	return 16
+}
+
 // ForEachAfter will call f() on every entry after t, splitting
 // entries if necessary so there is an entry starting at t
 func (cfg *SchemaConfig) ForEachAfter(t model.Time, f func(config *PeriodConfig)) {
@@ -219,7 +227,7 @@ func (cfg *SchemaConfig) ForEachAfter(t model.Time, f func(config *PeriodConfig)
 
 // CreateSchema returns the schema defined by the PeriodConfig
 func (cfg PeriodConfig) CreateSchema() Schema {
-	rowShards := uint32(16)
+	rowShards := defaultRowShards(cfg.Schema)
 	if cfg.RowShards > 0 {
 		rowShards = cfg.RowShards
 	}
@@ -309,6 +317,14 @@ func (cfg *SchemaConfig) Load() error {
 		return err
 	}
 
+	for i, periodCfg := range cfg.Configs {
+		// apply default row shards
+		if periodCfg.RowShards == 0 {
+			periodCfg.RowShards = defaultRowShards(periodCfg.Schema)
+			cfg.Configs[i] = periodCfg
+		}
+	}
+
 	return cfg.Validate()
 }
 
diff --git a/pkg/chunk/schema_test.go b/pkg/chunk/schema_test.go
index f42b4108768..c697e321677 100644
--- a/pkg/chunk/schema_test.go
+++ b/pkg/chunk/schema_test.go
@@ -8,6 +8,7 @@ import (
 	"sort"
 	"testing"
 
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	jsoniter "github.com/json-iterator/go"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
@@ -387,5 +388,70 @@ func BenchmarkEncodeLabelsString(b *testing.B) {
 	}
 	b.Log("data size", len(data))
 	b.Log("decode", decoded)
+}
+
+// TestEnsureEntriesInhabitInterface is a compile-time check: it stops building if any listed entries type no longer satisfies the entries interface.
+func TestEnsureEntriesInhabitInterface(t *testing.T) {
+	var _ = []entries{
+		originalEntries{},
+		base64Entries{},
+		labelNameInHashKeyEntries{},
+		v5Entries{},
+		v6Entries{},
+		v9Entries{},
+		v10Entries{},
+		v11Entries{},
+	}
+}
 
+func TestV10IndexQueries(t *testing.T) {
+	fromShards := func(n int) (res []IndexQuery) { // builds n queries whose hash values are prefixed 00..n-1
+		for i := 0; i < n; i++ {
+			res = append(res, IndexQuery{
+				TableName:       "tbl",
+				HashValue:       fmt.Sprintf("%02d:%s:%s:%s", i, "hash", "metric", "label"),
+				RangeValueStart: []byte(string(rune(i))), // explicit rune conversion: same bytes as string(i), but not flagged by go vet
+				ValueEqual:      []byte(string(rune(i))),
+			})
+		}
+		return res
+	}
+
+	var testExprs = []struct {
+		name     string
+		queries  []IndexQuery
+		shard    *astmapper.ShardAnnotation
+		expected []IndexQuery
+	}{
+		{
+			name:     "passthrough when no shard specified",
+			queries:  fromShards(2),
+			shard:    nil,
+			expected: fromShards(2),
+		},
+		{
+			name:    "out of bounds shard returns 0 matches",
+			queries: fromShards(2),
+			shard: &astmapper.ShardAnnotation{
+				Shard: 3,
+			},
+			expected: nil,
+		},
+		{
+			name:    "return correct shard",
+			queries: fromShards(3),
+			shard: &astmapper.ShardAnnotation{
+				Shard: 1,
+			},
+			expected: []IndexQuery{fromShards(2)[1]},
+		},
+	}
+
+	for _, c := range testExprs {
+		t.Run(c.name, func(t *testing.T) {
+			s := v10Entries{}
+			filtered := s.FilterReadQueries(c.queries, c.shard)
+			require.Equal(t, c.expected, filtered)
+		})
+	}
 }
diff --git a/pkg/chunk/schema_util.go b/pkg/chunk/schema_util.go
index 0906288e93f..3112da100f6 100644
--- a/pkg/chunk/schema_util.go
+++ b/pkg/chunk/schema_util.go
@@ -47,7 +47,8 @@ func labelsString(ls labels.Labels) string {
 	return b.String()
 }
 
-func labelsSeriesID(ls labels.Labels) []byte {
+// LabelsSeriesID hashes a label set
+func LabelsSeriesID(ls labels.Labels) []byte {
 	h := sha256.Sum256([]byte(labelsString(ls)))
 	return encodeBase64Bytes(h[:])
 }
diff --git a/pkg/chunk/schema_util_test.go b/pkg/chunk/schema_util_test.go
index 3e5eb95a3d4..3de4b75423b 100644
--- a/pkg/chunk/schema_util_test.go
+++ b/pkg/chunk/schema_util_test.go
@@ -38,7 +38,7 @@ func TestLabelSeriesID(t *testing.T) {
 			"RBNvo1WzZ4oRRq0W9+hknpT7T8If536DEMBg9hyq/4o",
 		},
 	} {
-		seriesID := string(labelsSeriesID(c.lbls))
+		seriesID := string(LabelsSeriesID(c.lbls))
 		assert.Equal(t, c.expected, seriesID, labelsString(c.lbls))
 	}
 }
diff --git a/pkg/chunk/series_store.go b/pkg/chunk/series_store.go
index 09d3c2beb0a..11a5656850e 100644
--- a/pkg/chunk/series_store.go
+++ b/pkg/chunk/series_store.go
@@ -14,6 +14,7 @@ import (
 	"github.com/weaveworks/common/httpgrpc"
 
 	"github.com/cortexproject/cortex/pkg/chunk/cache"
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/cortexproject/cortex/pkg/util/spanlogger"
 )
@@ -131,6 +132,15 @@ func (c *seriesStore) Get(ctx context.Context, userID string, from, through mode
 		return nil, err
 	}
 
+	// inject artificial __cortex_shard__ labels if present in the query. GetChunkRefs guarantees any chunk refs match the shard.
+	shard, _, err := astmapper.ShardFromMatchers(allMatchers)
+	if err != nil {
+		return nil, err
+	}
+	if shard != nil {
+		injectShardLabels(allChunks, *shard)
+	}
+
 	// Filter out chunks based on the empty matchers in the query.
 	filteredChunks := filterChunksByMatchers(allChunks, allMatchers)
 	return filteredChunks, nil
@@ -252,10 +262,21 @@ func (c *seriesStore) lookupSeriesByMetricNameMatchers(ctx context.Context, from
 	log, ctx := spanlogger.New(ctx, "SeriesStore.lookupSeriesByMetricNameMatchers", "metricName", metricName, "matchers", len(matchers))
 	defer log.Span.Finish()
 
+	// Check if one of the labels is a shard annotation, pass that information to lookupSeriesByMetricNameMatcher,
+	// and remove the label.
+	shard, shardLabelIndex, err := astmapper.ShardFromMatchers(matchers)
+	if err != nil {
+		return nil, err
+	}
+
+	if shard != nil {
+		matchers = append(matchers[:shardLabelIndex], matchers[shardLabelIndex+1:]...)
+	}
+
 	// Just get series for metric if there are no matchers
 	if len(matchers) == 0 {
 		indexLookupsPerQuery.Observe(1)
-		series, err := c.lookupSeriesByMetricNameMatcher(ctx, from, through, userID, metricName, nil)
+		series, err := c.lookupSeriesByMetricNameMatcher(ctx, from, through, userID, metricName, nil, shard)
 		if err != nil {
 			preIntersectionPerQuery.Observe(float64(len(series)))
 			postIntersectionPerQuery.Observe(float64(len(series)))
@@ -269,7 +290,7 @@ func (c *seriesStore) lookupSeriesByMetricNameMatchers(ctx context.Context, from
 	indexLookupsPerQuery.Observe(float64(len(matchers)))
 	for _, matcher := range matchers {
 		go func(matcher *labels.Matcher) {
-			ids, err := c.lookupSeriesByMetricNameMatcher(ctx, from, through, userID, metricName, matcher)
+			ids, err := c.lookupSeriesByMetricNameMatcher(ctx, from, through, userID, metricName, matcher, shard)
 			if err != nil {
 				incomingErrors <- err
 				return
@@ -320,7 +341,7 @@ func (c *seriesStore) lookupSeriesByMetricNameMatchers(ctx context.Context, from
 	return ids, nil
 }
 
-func (c *seriesStore) lookupSeriesByMetricNameMatcher(ctx context.Context, from, through model.Time, userID, metricName string, matcher *labels.Matcher) ([]string, error) {
+func (c *seriesStore) lookupSeriesByMetricNameMatcher(ctx context.Context, from, through model.Time, userID, metricName string, matcher *labels.Matcher, shard *astmapper.ShardAnnotation) ([]string, error) {
 	log, ctx := spanlogger.New(ctx, "SeriesStore.lookupSeriesByMetricNameMatcher", "metricName", metricName, "matcher", matcher)
 	defer log.Span.Finish()
 
@@ -341,6 +362,10 @@ func (c *seriesStore) lookupSeriesByMetricNameMatcher(ctx context.Context, from,
 	}
 	level.Debug(log).Log("queries", len(queries))
 
+	queries = c.schema.FilterReadQueries(queries, shard)
+
+	level.Debug(log).Log("filteredQueries", len(queries))
+
 	entries, err := c.lookupEntriesByQueries(ctx, queries)
 	if e, ok := err.(CardinalityExceededError); ok {
 		e.MetricName = metricName
diff --git a/pkg/chunk/storage/caching_index_client.go b/pkg/chunk/storage/caching_index_client.go
index f1863653b79..ab74f521784 100644
--- a/pkg/chunk/storage/caching_index_client.go
+++ b/pkg/chunk/storage/caching_index_client.go
@@ -66,6 +66,9 @@ func (s *cachingIndexClient) Stop() {
 }
 
 func (s *cachingIndexClient) QueryPages(ctx context.Context, queries []chunk.IndexQuery, callback func(chunk.IndexQuery, chunk.ReadBatch) (shouldContinue bool)) error {
+	log, ctx := spanlogger.New(ctx, "cachingIndexClient.QueryPages")
+	defer log.Finish()
+
 	// We cache the entire row, so filter client side.
 	callback = chunk_util.QueryFilter(callback)
 
diff --git a/pkg/cortex/modules.go b/pkg/cortex/modules.go
index d493e905715..5cc5f065212 100644
--- a/pkg/cortex/modules.go
+++ b/pkg/cortex/modules.go
@@ -3,6 +3,7 @@ package cortex
 import (
 	"errors"
 	"fmt"
+	"math"
 	"net/http"
 	"os"
 	"regexp"
@@ -12,6 +13,7 @@ import (
 	"github.com/prometheus/client_golang/prometheus"
 	"github.com/prometheus/common/route"
 	"github.com/prometheus/prometheus/config"
+	"github.com/prometheus/prometheus/promql"
 	v1 "github.com/prometheus/prometheus/web/api/v1"
 	httpgrpc_server "github.com/weaveworks/common/httpgrpc/server"
 	"github.com/weaveworks/common/middleware"
@@ -28,6 +30,7 @@ import (
 	"github.com/cortexproject/cortex/pkg/ingester"
 	"github.com/cortexproject/cortex/pkg/ingester/client"
 	"github.com/cortexproject/cortex/pkg/querier"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 	"github.com/cortexproject/cortex/pkg/querier/frontend"
 	"github.com/cortexproject/cortex/pkg/querier/queryrange"
 	"github.com/cortexproject/cortex/pkg/ring"
@@ -226,7 +229,8 @@ func (t *Cortex) stopDistributor() (err error) {
 }
 
 func (t *Cortex) initQuerier(cfg *Config) (err error) {
-	var store querier.ChunkStore
+
+	var store chunkstore.ChunkStore
 
 	if cfg.Storage.Engine == storage.StorageEngineTSDB {
 		store, err = querier.NewBlockQuerier(cfg.TSDB, cfg.Server.LogLevel, prometheus.DefaultRegisterer)
@@ -332,11 +336,32 @@ func (t *Cortex) stopStore() error {
 }
 
 func (t *Cortex) initQueryFrontend(cfg *Config) (err error) {
+	err = cfg.Schema.Load()
+	if err != nil {
+		return
+	}
+
 	t.frontend, err = frontend.New(cfg.Frontend, util.Logger)
 	if err != nil {
 		return
 	}
-	tripperware, cache, err := queryrange.NewTripperware(cfg.QueryRange, util.Logger, t.overrides, queryrange.PrometheusCodec, queryrange.PrometheusResponseExtractor)
+	tripperware, cache, err := queryrange.NewTripperware(
+		cfg.QueryRange,
+		util.Logger,
+		t.overrides,
+		queryrange.PrometheusCodec,
+		queryrange.PrometheusResponseExtractor,
+		cfg.Schema,
+		promql.EngineOpts{
+			Logger:        util.Logger,
+			Reg:           prometheus.DefaultRegisterer,
+			MaxConcurrent: int(math.MaxInt64), // the frontend's promql engine should not set any concurrency controls (these are handled by middleware)
+			MaxSamples:    cfg.Querier.MaxSamples,
+			Timeout:       cfg.Querier.Timeout,
+		},
+		cfg.Querier.IngesterMaxQueryLookback,
+	)
+
 	if err != nil {
 		return err
 	}
diff --git a/pkg/ingester/ingester.go b/pkg/ingester/ingester.go
index dcd52a9baec..3f6d586ff69 100644
--- a/pkg/ingester/ingester.go
+++ b/pkg/ingester/ingester.go
@@ -436,6 +436,7 @@ func (i *Ingester) Query(ctx context.Context, req *client.QueryRequest) (*client
 	result := &client.QueryResponse{}
 	numSeries, numSamples := 0, 0
 	maxSamplesPerQuery := i.limits.MaxSamplesPerQuery(userID)
+
 	err = state.forSeriesMatching(ctx, matchers, func(ctx context.Context, _ model.Fingerprint, series *memorySeries) error {
 		values, err := series.samplesForRange(from, through)
 		if err != nil {
@@ -518,6 +519,7 @@ func (i *Ingester) QueryStream(req *client.QueryRequest, stream client.Ingester_
 		}
 
 		numChunks += len(wireChunks)
+
 		batch = append(batch, client.TimeSeriesChunk{
 			Labels: client.FromLabelsToLabelAdapters(series.metric),
 			Chunks: wireChunks,
diff --git a/pkg/querier/astmapper/astmapper.go b/pkg/querier/astmapper/astmapper.go
new file mode 100644
index 00000000000..a93cd69161d
--- /dev/null
+++ b/pkg/querier/astmapper/astmapper.go
@@ -0,0 +1,187 @@
+package astmapper
+
+import (
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/promql"
+)
+
+// ASTMapper is the exported interface for mapping between multiple AST representations
+type ASTMapper interface {
+	Map(node promql.Node) (promql.Node, error)
+}
+
+// MapperFunc is a function adapter for ASTMapper
+type MapperFunc func(node promql.Node) (promql.Node, error)
+
+// Map applies a mapperfunc as an ASTMapper
+func (fn MapperFunc) Map(node promql.Node) (promql.Node, error) {
+	return fn(node)
+}
+
+// MultiMapper can compose multiple ASTMappers
+type MultiMapper struct {
+	mappers []ASTMapper
+}
+
+// Map impls ASTMapper by threading node through every registered mapper in
+// registration order, feeding each mapper the output of the previous one.
+// It fails if no mappers are registered or as soon as any mapper errors.
+func (m *MultiMapper) Map(node promql.Node) (promql.Node, error) {
+	if len(m.mappers) == 0 {
+		return nil, errors.New("MultiMapper: No mappers registered")
+	}
+
+	current := node
+	for _, mapper := range m.mappers {
+		next, err := mapper.Map(current)
+		if err != nil {
+			return nil, err
+		}
+		current = next
+	}
+	return current, nil
+}
+
+// Register adds ASTMappers into a multimapper.
+// Since registered functions are applied in the order they're registered, it's advised to register them
+// in decreasing priority and only operate on nodes that each function cares about, defaulting to CloneNode.
+func (m *MultiMapper) Register(xs ...ASTMapper) {
+	m.mappers = append(m.mappers, xs...)
+}
+
+// NewMultiMapper instantiates a MultiMapper and registers the given ASTMappers on it, in order
+func NewMultiMapper(xs ...ASTMapper) *MultiMapper {
+	m := &MultiMapper{}
+	m.Register(xs...)
+	return m
+}
+
+// CloneNode is a helper function to clone a node by rendering it with String() and re-parsing the result.
+func CloneNode(node promql.Node) (promql.Node, error) {
+	return promql.ParseExpr(node.String())
+}
+
+// NodeMapper either maps a single AST node or returns the unaltered node.
+// It also returns a bool to signal that no further recursion is necessary.
+// This is helpful because it allows mappers to only implement logic for node types they want to change.
+// It makes some mappers trivially easy to implement
+type NodeMapper interface {
+	MapNode(node promql.Node) (mapped promql.Node, finished bool, err error)
+}
+
+// NodeMapperFunc is an adapter for NodeMapper
+type NodeMapperFunc func(node promql.Node) (promql.Node, bool, error)
+
+// MapNode applies a NodeMapperFunc as a NodeMapper
+func (f NodeMapperFunc) MapNode(node promql.Node) (promql.Node, bool, error) {
+	return f(node)
+}
+
+// NewASTNodeMapper creates an ASTMapper from a NodeMapper
+func NewASTNodeMapper(mapper NodeMapper) ASTNodeMapper {
+	return ASTNodeMapper{mapper}
+}
+
+// ASTNodeMapper is an ASTMapper adapter which uses a NodeMapper internally.
+type ASTNodeMapper struct {
+	NodeMapper
+}
+
+// Map impls ASTMapper from a NodeMapper. It applies MapNode to node and, unless the
+// mapper reports it is finished, recurses into the node's children, mutating node in
+// place. Node types it does not know how to traverse yield an error instead of a panic.
+func (nm ASTNodeMapper) Map(node promql.Node) (promql.Node, error) {
+	node, fin, err := nm.MapNode(node)
+	if err != nil {
+		return nil, err
+	}
+	if fin {
+		return node, nil
+	}
+
+	switch n := node.(type) {
+	case nil:
+		// nil handles cases where we check optional fields that are not set
+		return nil, nil
+
+	case promql.Expressions:
+		for i, e := range n {
+			mapped, err := nm.Map(e)
+			if err != nil {
+				return nil, err
+			}
+			n[i] = mapped.(promql.Expr)
+		}
+		return n, nil
+
+	case *promql.AggregateExpr:
+		expr, err := nm.Map(n.Expr)
+		if err != nil {
+			return nil, err
+		}
+		n.Expr = expr.(promql.Expr)
+		return n, nil
+
+	case *promql.BinaryExpr:
+		lhs, err := nm.Map(n.LHS)
+		if err != nil {
+			return nil, err
+		}
+		n.LHS = lhs.(promql.Expr)
+
+		rhs, err := nm.Map(n.RHS)
+		if err != nil {
+			return nil, err
+		}
+		n.RHS = rhs.(promql.Expr)
+		return n, nil
+
+	case *promql.Call:
+		for i, e := range n.Args {
+			mapped, err := nm.Map(e)
+			if err != nil {
+				return nil, err
+			}
+			n.Args[i] = mapped.(promql.Expr)
+		}
+		return n, nil
+
+	case *promql.SubqueryExpr:
+		mapped, err := nm.Map(n.Expr)
+		if err != nil {
+			return nil, err
+		}
+		n.Expr = mapped.(promql.Expr)
+		return n, nil
+
+	case *promql.ParenExpr:
+		mapped, err := nm.Map(n.Expr)
+		if err != nil {
+			return nil, err
+		}
+		n.Expr = mapped.(promql.Expr)
+		return n, nil
+
+	case *promql.UnaryExpr:
+		mapped, err := nm.Map(n.Expr)
+		if err != nil {
+			return nil, err
+		}
+		n.Expr = mapped.(promql.Expr)
+		return n, nil
+
+	case *promql.EvalStmt:
+		mapped, err := nm.Map(n.Expr)
+		if err != nil {
+			return nil, err
+		}
+		n.Expr = mapped.(promql.Expr)
+		return n, nil
+
+	case *promql.NumberLiteral, *promql.StringLiteral, *promql.VectorSelector, *promql.MatrixSelector:
+		return n, nil
+
+	default:
+		return nil, errors.Errorf("nodeMapper: unhandled node type %T", node)
+	}
+}
diff --git a/pkg/querier/astmapper/astmapper_test.go b/pkg/querier/astmapper/astmapper_test.go
new file mode 100644
index 00000000000..c3f0c0b9f1f
--- /dev/null
+++ b/pkg/querier/astmapper/astmapper_test.go
@@ -0,0 +1,102 @@
+package astmapper
+
+import (
+	"fmt"
+	"testing"
+
+	"github.com/prometheus/common/model"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/stretchr/testify/require"
+)
+
+func TestCloneNode(t *testing.T) {
+	var testExpr = []struct {
+		input    promql.Expr
+		expected promql.Expr
+	}{
+		// simple unmodified case
+		{
+			&promql.BinaryExpr{
+				Op:  promql.ItemADD,
+				LHS: &promql.NumberLiteral{Val: 1},
+				RHS: &promql.NumberLiteral{Val: 1},
+			},
+			&promql.BinaryExpr{
+				Op:  promql.ItemADD,
+				LHS: &promql.NumberLiteral{Val: 1},
+				RHS: &promql.NumberLiteral{Val: 1},
+			},
+		},
+		{
+			&promql.AggregateExpr{
+				Op:      promql.ItemSum,
+				Without: true,
+				Expr: &promql.VectorSelector{
+					Name: "some_metric",
+					LabelMatchers: []*labels.Matcher{
+						mustLabelMatcher(labels.MatchEqual, string(model.MetricNameLabel), "some_metric"),
+					},
+				},
+				Grouping: []string{"foo"},
+			},
+			&promql.AggregateExpr{
+				Op:      promql.ItemSum,
+				Without: true,
+				Expr: &promql.VectorSelector{
+					Name: "some_metric",
+					LabelMatchers: []*labels.Matcher{
+						mustLabelMatcher(labels.MatchEqual, string(model.MetricNameLabel), "some_metric"),
+					},
+				},
+				Grouping: []string{"foo"},
+			},
+		},
+	}
+
+	for i, c := range testExpr {
+		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
+			res, err := CloneNode(c.input)
+			require.NoError(t, err)
+			require.Equal(t, c.expected, res)
+		})
+	}
+}
+
+func TestCloneNode_String(t *testing.T) {
+	var testExpr = []struct {
+		input    string
+		expected string
+	}{
+		{
+			input:    `rate(http_requests_total{cluster="us-central1"}[1m])`,
+			expected: `rate(http_requests_total{cluster="us-central1"}[1m])`,
+		},
+		{
+			input: `sum(
+sum(rate(http_requests_total{cluster="us-central1"}[1m]))
+/
+sum(rate(http_requests_total{cluster="ops-tools1"}[1m]))
+)`,
+			expected: `sum(sum(rate(http_requests_total{cluster="us-central1"}[1m])) / sum(rate(http_requests_total{cluster="ops-tools1"}[1m])))`,
+		},
+	}
+
+	for i, c := range testExpr {
+		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
+			expr, err := promql.ParseExpr(c.input)
+			require.Nil(t, err)
+			res, err := CloneNode(expr)
+			require.Nil(t, err)
+			require.Equal(t, c.expected, res.String())
+		})
+	}
+}
+
+func mustLabelMatcher(mt labels.MatchType, name, val string) *labels.Matcher {
+	m, err := labels.NewMatcher(mt, name, val)
+	if err != nil {
+		panic(err)
+	}
+	return m
+}
diff --git a/pkg/querier/astmapper/embedded.go b/pkg/querier/astmapper/embedded.go
new file mode 100644
index 00000000000..c8adec0b4e6
--- /dev/null
+++ b/pkg/querier/astmapper/embedded.go
@@ -0,0 +1,120 @@
+package astmapper
+
+import (
+	"encoding/json"
+	"time"
+
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+)
+
+/*
+Design:
+
+The prometheus api package enforces a (*promql.Engine argument), making it infeasible to do lazy AST
+evaluation and substitution from within this package.
+This leaves the (storage.Queryable) interface as the remaining target for conducting application level sharding.
+
+The main idea is to analyze the AST and determine which subtrees can be parallelized. With those in hand, the queries may
+be remapped into vector or matrix selectors utilizing a reserved label containing the original query. These may then be parallelized in the storage implementation.
+*/
+
+const (
+	// QueryLabel is a reserved label containing an embedded query
+	QueryLabel = "__cortex_queries__"
+	// EmbeddedQueryFlag is a reserved label (metric name) denoting an embedded query
+	EmbeddedQueryFlag = "__embedded_queries__"
+)
+
+// EmbeddedQueries is a wrapper type for encoding queries
+type EmbeddedQueries struct {
+	Concat []string `json:"Concat"`
+}
+
+// JSONCodec is a Codec impl that uses JSON representations of EmbeddedQueries structs
+var JSONCodec Codec = jsonCodec{}
+
+type jsonCodec struct{}
+
+func (c jsonCodec) Encode(queries []string) string {
+	embedded := EmbeddedQueries{
+		Concat: queries,
+	}
+	b, err := json.Marshal(embedded)
+
+	if err != nil {
+		panic(err)
+	}
+
+	return string(b)
+}
+
+func (c jsonCodec) Decode(encoded string) (queries []string, err error) {
+	var embedded EmbeddedQueries
+	err = json.Unmarshal([]byte(encoded), &embedded)
+	if err != nil {
+		return nil, err
+	}
+
+	return embedded.Concat, nil
+}
+
+// A Codec is responsible for encoding/decoding queries
+type Codec interface {
+	Encode([]string) string
+	Decode(string) ([]string, error)
+}
+
+// Squash encodes nodes with codec into one QueryLabel matcher on an EmbeddedQueryFlag vector (or matrix) selector.
+func Squash(codec Codec, isMatrix bool, nodes ...promql.Node) (promql.Expr, error) {
+	if codec == nil {
+		return nil, errors.Errorf("nil Codec")
+	}
+
+	// render every node (one leg each) back to its query string form
+	strs := make([]string, 0, len(nodes))
+	for _, node := range nodes {
+		strs = append(strs, node.String())
+	}
+
+	encoded := codec.Encode(strs)
+
+	embeddedQuery, err := labels.NewMatcher(labels.MatchEqual, QueryLabel, encoded)
+
+	if err != nil {
+		return nil, err
+	}
+
+	if isMatrix {
+		return &promql.MatrixSelector{
+			Name:          EmbeddedQueryFlag,
+			Range:         time.Minute, // NOTE(review): fixed range, independent of the embedded queries — confirm intent
+			LabelMatchers: []*labels.Matcher{embeddedQuery},
+		}, nil
+	}
+
+	return &promql.VectorSelector{
+		Name:          EmbeddedQueryFlag,
+		LabelMatchers: []*labels.Matcher{embeddedQuery},
+	}, nil
+}
+
+// VectorSquasher always uses a VectorSelector as the substitution node.
+// This is important because logical/set binops can only be applied against vectors and not matrices.
+func VectorSquasher(nodes ...promql.Node) (promql.Expr, error) {
+	return Squash(JSONCodec, false, nodes...)
+}
+
+// OrSquasher is a custom squasher which mimics the intuitive but less efficient OR'ing of sharded vectors.
+// It left-folds nodes with the `or` operator and returns an error when called without any nodes.
+func OrSquasher(nodes ...promql.Node) (promql.Expr, error) {
+	if len(nodes) == 0 {
+		return nil, errors.New("OrSquasher: no nodes to combine")
+	}
+	combined := nodes[0].(promql.Expr)
+	for _, node := range nodes[1:] {
+		combined = &promql.BinaryExpr{Op: promql.ItemLOR, LHS: combined, RHS: node.(promql.Expr)}
+	}
+	return combined, nil
+}
diff --git a/pkg/querier/astmapper/parallel.go b/pkg/querier/astmapper/parallel.go
new file mode 100644
index 00000000000..5b42f358bcb
--- /dev/null
+++ b/pkg/querier/astmapper/parallel.go
@@ -0,0 +1,92 @@
+package astmapper
+
+import (
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/promql"
+)
+
+var summableAggregates = map[promql.ItemType]struct{}{
+	promql.ItemSum:     {},
+	promql.ItemMin:     {},
+	promql.ItemMax:     {},
+	promql.ItemTopK:    {},
+	promql.ItemBottomK: {},
+	promql.ItemCount:   {},
+}
+
+var nonParallelFuncs = []string{
+	"histogram_quantile",
+	"quantile_over_time",
+}
+
+// CanParallel tests if a subtree is parallelizable.
+// A subtree is parallelizable if all of its components are parallelizable.
+// It panics when it encounters a node type it does not know how to inspect.
+func CanParallel(node promql.Node) bool {
+	switch n := node.(type) {
+	case nil:
+		// nil handles cases where we check optional fields that are not set
+		return true
+
+	case promql.Expressions:
+		for _, e := range n {
+			if !CanParallel(e) {
+				return false
+			}
+		}
+		return true
+
+	case *promql.AggregateExpr:
+		_, ok := summableAggregates[n.Op]
+		return ok && CanParallel(n.Expr)
+
+	case *promql.BinaryExpr:
+		// since binary exprs use each side for merging, they cannot be parallelized
+		return false
+
+	case *promql.Call:
+		if n.Func == nil {
+			return false
+		}
+		if !ParallelFunc(*n.Func) {
+			return false
+		}
+
+		for _, e := range n.Args {
+			if !CanParallel(e) {
+				return false
+			}
+		}
+		return true
+
+	case *promql.SubqueryExpr:
+		return CanParallel(n.Expr)
+
+	case *promql.ParenExpr:
+		return CanParallel(n.Expr)
+
+	case *promql.UnaryExpr:
+		// Unary operators may wrap instant vectors as well as scalars, so the operand decides.
+		return CanParallel(n.Expr)
+
+	case *promql.EvalStmt:
+		return CanParallel(n.Expr)
+
+	case *promql.MatrixSelector, *promql.NumberLiteral, *promql.StringLiteral, *promql.VectorSelector:
+		return true
+
+	default:
+		panic(errors.Errorf("CanParallel: unhandled node type %T", node))
+	}
+}
+
+// ParallelFunc reports whether a promql function may appear inside a parallel query,
+// i.e. whether its name is absent from nonParallelFuncs.
+func ParallelFunc(f promql.Function) bool {
+	for i := range nonParallelFuncs {
+		if nonParallelFuncs[i] == f.Name {
+			return false
+		}
+	}
+	return true
+}
diff --git a/pkg/querier/astmapper/parallel_test.go b/pkg/querier/astmapper/parallel_test.go
new file mode 100644
index 00000000000..6032137f57b
--- /dev/null
+++ b/pkg/querier/astmapper/parallel_test.go
@@ -0,0 +1,119 @@
+package astmapper
+
+import (
+	"fmt"
+	"testing"
+
+	"github.com/prometheus/common/model"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/stretchr/testify/require"
+)
+
+func TestCanParallel(t *testing.T) {
+	var testExpr = []struct {
+		input    promql.Expr
+		expected bool
+	}{
+		// simple sum
+		{
+			&promql.AggregateExpr{
+				Op:      promql.ItemSum,
+				Without: true,
+				Expr: &promql.VectorSelector{
+					Name: "some_metric",
+					LabelMatchers: []*labels.Matcher{
+						mustLabelMatcher(labels.MatchEqual, string(model.MetricNameLabel), "some_metric"),
+					},
+				},
+				Grouping: []string{"foo"},
+			},
+			true,
+		},
+		/*
+			  sum(
+				  sum by (foo) bar1{baz=”blip”}[1m])
+				/
+				  sum by (foo) bar2{baz=”blip”}[1m]))
+			  )
+		*/
+		{
+			&promql.AggregateExpr{
+				Op: promql.ItemSum,
+				Expr: &promql.BinaryExpr{
+					Op: promql.ItemDIV,
+					LHS: &promql.AggregateExpr{
+						Op:       promql.ItemSum,
+						Grouping: []string{"foo"},
+						Expr: &promql.VectorSelector{
+							Name: "idk",
+							LabelMatchers: []*labels.Matcher{
+								mustLabelMatcher(labels.MatchEqual, string(model.MetricNameLabel), "bar1"),
+							}},
+					},
+					RHS: &promql.AggregateExpr{
+						Op:       promql.ItemSum,
+						Grouping: []string{"foo"},
+						Expr: &promql.VectorSelector{
+							Name: "idk",
+							LabelMatchers: []*labels.Matcher{
+								mustLabelMatcher(labels.MatchEqual, string(model.MetricNameLabel), "bar2"),
+							}},
+					},
+				},
+			},
+			false,
+		},
+		// sum by (foo) bar1{baz=”blip”}[1m]) ---- this is the first leg of the above
+		{
+			&promql.AggregateExpr{
+				Op:       promql.ItemSum,
+				Grouping: []string{"foo"},
+				Expr: &promql.VectorSelector{
+					Name: "idk",
+					LabelMatchers: []*labels.Matcher{
+						mustLabelMatcher(labels.MatchEqual, string(model.MetricNameLabel), "bar1"),
+					}},
+			},
+			true,
+		},
+	}
+
+	for i, c := range testExpr {
+		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
+			res := CanParallel(c.input)
+			require.Equal(t, c.expected, res)
+		})
+	}
+}
+
+func TestCanParallel_String(t *testing.T) {
+	var testExpr = []struct {
+		input    string
+		expected bool
+	}{
+		{
+			`sum by (foo) (rate(bar1{baz="blip"}[1m]))`,
+			true,
+		},
+		{
+			`sum by (foo) (histogram_quantile(0.9, rate(http_request_duration_seconds_bucket[10m])))`,
+			false,
+		},
+		{
+			`sum by (foo) (
+			  quantile_over_time(0.9, http_request_duration_seconds_bucket[10m])
+			)`,
+			false,
+		},
+	}
+
+	for i, c := range testExpr {
+		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
+			expr, err := promql.ParseExpr(c.input)
+			require.Nil(t, err)
+			res := CanParallel(expr)
+			require.Equal(t, c.expected, res)
+		})
+	}
+}
diff --git a/pkg/querier/astmapper/shard_summer.go b/pkg/querier/astmapper/shard_summer.go
new file mode 100644
index 00000000000..4face8feb16
--- /dev/null
+++ b/pkg/querier/astmapper/shard_summer.go
@@ -0,0 +1,293 @@
+package astmapper
+
+import (
+	"fmt"
+
+	"regexp"
+
+	"strings"
+
+	"strconv"
+
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+)
+
+const (
+	// ShardLabel is a reserved label referencing a cortex shard
+	ShardLabel = "__cortex_shard__"
+	// ShardLabelFmt is the fmt of the ShardLabel key.
+	ShardLabelFmt = "%d_of_%d"
+)
+
+var (
+	// ShardLabelRE matches a value in ShardLabelFmt
+	ShardLabelRE = regexp.MustCompile("^[0-9]+_of_[0-9]+$")
+)
+
+type squasher = func(...promql.Node) (promql.Expr, error)
+
+type shardSummer struct {
+	shards   int
+	curshard *int
+	squash   squasher
+}
+
+// NewShardSummer instantiates an ASTMapper which will fan out sums queries by shard
+func NewShardSummer(shards int, squasher squasher) (ASTMapper, error) {
+	if squasher == nil {
+		return nil, errors.Errorf("squasher required and not passed")
+	}
+
+	return NewASTNodeMapper(&shardSummer{
+		shards:   shards,
+		squash:   squasher,
+		curshard: nil,
+	}), nil
+}
+
+// CopyWithCurShard clones a shardSummer with a new current shard.
+func (summer *shardSummer) CopyWithCurShard(curshard int) *shardSummer {
+	s := *summer
+	s.curshard = &curshard
+	return &s
+}
+
+// MapNode impls NodeMapper: parallelizable sum aggregations are replaced by their sharded
+// equivalent and, when a current shard is set, selectors are annotated with the shard label.
+func (summer *shardSummer) MapNode(node promql.Node) (promql.Node, bool, error) {
+	switch n := node.(type) {
+	case *promql.AggregateExpr:
+		// check the operator first: it is cheap, whereas CanParallel walks the whole subtree
+		if n.Op == promql.ItemSum && CanParallel(n) {
+			result, err := summer.shardSum(n)
+			return result, true, err
+		}
+
+		return n, false, nil
+
+	case *promql.VectorSelector:
+		if summer.curshard != nil {
+			mapped, err := shardVectorSelector(*summer.curshard, summer.shards, n)
+			return mapped, true, err
+		}
+		return n, true, nil
+
+	case *promql.MatrixSelector:
+		if summer.curshard != nil {
+			mapped, err := shardMatrixSelector(*summer.curshard, summer.shards, n)
+			return mapped, true, err
+		}
+		return n, true, nil
+
+	default:
+		return n, false, nil
+	}
+}
+
+// shardSum contains the logic for how we split/stitch legs of a parallelized sum query
+func (summer *shardSummer) shardSum(expr *promql.AggregateExpr) (promql.Node, error) {
+
+	parent, subSums, err := summer.splitSum(expr)
+	if err != nil {
+		return nil, err
+	}
+
+	combinedSums, err := summer.squash(subSums...)
+
+	if err != nil {
+		return nil, err
+	}
+
+	parent.Expr = combinedSums
+	return parent, nil
+}
+
+// splitSum forms the parent and child legs of a parallel query
+func (summer *shardSummer) splitSum(
+	expr *promql.AggregateExpr,
+) (
+	parent *promql.AggregateExpr,
+	children []promql.Node,
+	err error,
+) {
+	parent = &promql.AggregateExpr{
+		Op:    expr.Op,
+		Param: expr.Param,
+	}
+	var mkChild func(sharded *promql.AggregateExpr) promql.Expr
+
+	if expr.Without {
+		/*
+			parallelizing a sum using without(foo) is representable naively as
+			sum without(foo) (
+			  sum without(__cortex_shard__) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+			  sum without(__cortex_shard__) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			)
+			or (more optimized):
+			sum without(__cortex_shard__) (
+			  sum without(foo) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+			  sum without(foo) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			)
+
+		*/
+		parent.Grouping = []string{ShardLabel}
+		parent.Without = true
+		mkChild = func(sharded *promql.AggregateExpr) promql.Expr {
+			sharded.Grouping = expr.Grouping
+			sharded.Without = true
+			return sharded
+		}
+	} else if len(expr.Grouping) > 0 {
+		/*
+			parallelizing a sum using by(foo) is representable as
+			sum by(foo) (
+			  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+			  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			)
+		*/
+		parent.Grouping = expr.Grouping
+		mkChild = func(sharded *promql.AggregateExpr) promql.Expr {
+			groups := make([]string, 0, len(expr.Grouping)+1)
+			groups = append(groups, expr.Grouping...)
+			groups = append(groups, ShardLabel)
+			sharded.Grouping = groups
+			return sharded
+		}
+	} else {
+		/*
+			parallelizing a non-parameterized sum is representable as
+			sum(
+			  sum without(__cortex_shard__) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+			  sum without(__cortex_shard__) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			)
+			or (more optimized):
+			sum without(__cortex_shard__) (
+			  sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+			  sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			)
+		*/
+		parent.Grouping = []string{ShardLabel}
+		parent.Without = true
+		mkChild = func(sharded *promql.AggregateExpr) promql.Expr {
+			sharded.Grouping = []string{ShardLabel}
+			return sharded
+		}
+	}
+
+	// iterate across shardFactor to create children
+	for i := 0; i < summer.shards; i++ {
+		cloned, err := CloneNode(expr.Expr)
+		if err != nil {
+			return parent, children, err
+		}
+
+		subSummer := NewASTNodeMapper(summer.CopyWithCurShard(i))
+		sharded, err := subSummer.Map(cloned)
+		if err != nil {
+			return parent, children, err
+		}
+
+		subSum := mkChild(&promql.AggregateExpr{
+			Op:   expr.Op,
+			Expr: sharded.(promql.Expr),
+		})
+
+		children = append(children,
+			subSum,
+		)
+	}
+
+	return parent, children, nil
+}
+
+func shardVectorSelector(curshard, shards int, selector *promql.VectorSelector) (promql.Node, error) {
+	shardMatcher, err := labels.NewMatcher(labels.MatchEqual, ShardLabel, fmt.Sprintf(ShardLabelFmt, curshard, shards))
+	if err != nil {
+		return nil, err
+	}
+
+	return &promql.VectorSelector{
+		Name:   selector.Name,
+		Offset: selector.Offset,
+		LabelMatchers: append(
+			[]*labels.Matcher{shardMatcher},
+			selector.LabelMatchers...,
+		),
+	}, nil
+}
+
+func shardMatrixSelector(curshard, shards int, selector *promql.MatrixSelector) (promql.Node, error) {
+	shardMatcher, err := labels.NewMatcher(labels.MatchEqual, ShardLabel, fmt.Sprintf(ShardLabelFmt, curshard, shards))
+	if err != nil {
+		return nil, err
+	}
+
+	return &promql.MatrixSelector{
+		Name:   selector.Name,
+		Range:  selector.Range,
+		Offset: selector.Offset,
+		LabelMatchers: append(
+			[]*labels.Matcher{shardMatcher},
+			selector.LabelMatchers...,
+		),
+	}, nil
+}
+
+// ParseShard extracts the shard index and shard count from a label value written in
+// ShardLabelFmt ("<shard>_of_<total>"); it rejects malformed values and any shard >= total.
+func ParseShard(input string) (parsed ShardAnnotation, err error) {
+	if !ShardLabelRE.MatchString(input) {
+		return parsed, errors.Errorf("Invalid ShardLabel value: [%s]", input)
+	}
+
+	// ShardLabelRE only admits values with three "_"-separated fields: <shard>, "of", <total>.
+	fields := strings.Split(input, "_")
+	shard, err := strconv.Atoi(fields[0])
+	if err != nil {
+		return parsed, err
+	}
+	total, err := strconv.Atoi(fields[2])
+	if err != nil {
+		return parsed, err
+	}
+	if shard >= total {
+		return parsed, errors.Errorf("Shards out of bounds: [%d] >= [%d]", shard, total)
+	}
+
+	parsed.Shard, parsed.Of = shard, total
+	return parsed, nil
+}
+
+// ShardAnnotation is a convenience struct which holds data from a parsed shard label
+type ShardAnnotation struct {
+	Shard int
+	Of    int
+}
+
+// String encodes a shardAnnotation into a label value
+func (shard ShardAnnotation) String() string {
+	return fmt.Sprintf(ShardLabelFmt, shard.Shard, shard.Of)
+}
+
+// Label generates the ShardAnnotation as a label
+func (shard ShardAnnotation) Label() labels.Label {
+	return labels.Label{
+		Name:  ShardLabel,
+		Value: shard.String(),
+	}
+}
+
+// ShardFromMatchers parses the first equality matcher on ShardLabel and returns it with that matcher's index; (nil, 0, nil) if none.
+func ShardFromMatchers(matchers []*labels.Matcher) (shard *ShardAnnotation, idx int, err error) {
+	for i, matcher := range matchers {
+		if matcher.Type == labels.MatchEqual && matcher.Name == ShardLabel {
+			parsed, parseErr := ParseShard(matcher.Value)
+			if parseErr != nil {
+				return nil, i, parseErr
+			}
+			return &parsed, i, nil
+		}
+	}
+	return nil, 0, nil
+}
diff --git a/pkg/querier/astmapper/shard_summer_test.go b/pkg/querier/astmapper/shard_summer_test.go
new file mode 100644
index 00000000000..9182e2d87ac
--- /dev/null
+++ b/pkg/querier/astmapper/shard_summer_test.go
@@ -0,0 +1,256 @@
+package astmapper
+
+import (
+	"fmt"
+	"testing"
+
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/stretchr/testify/require"
+)
+
+func TestShardSummer(t *testing.T) {
+	var testExpr = []struct {
+		shards   int
+		input    string
+		expected string
+	}{
+		{
+			shards: 3,
+			input:  `sum(rate(bar1{baz="blip"}[1m]))`,
+			expected: `sum without(__cortex_shard__) (
+			  sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="0_of_3",baz="blip"}[1m])) or
+			  sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="1_of_3",baz="blip"}[1m])) or
+			  sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="2_of_3",baz="blip"}[1m]))
+			)`,
+		},
+		{
+			shards: 3,
+			input:  `sum by(foo) (rate(bar1{baz="blip"}[1m]))`,
+			expected: `sum by(foo) (
+			  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="0_of_3",baz="blip"}[1m])) or
+			  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="1_of_3",baz="blip"}[1m])) or
+			  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="2_of_3",baz="blip"}[1m]))
+			)`,
+		},
+		{
+			shards: 2,
+			input: `sum(
+				sum by (foo) (rate(bar1{baz="blip"}[1m]))
+				/
+				sum by (foo) (rate(foo{baz="blip"}[1m]))
+			)`,
+			expected: `sum(
+			  sum by(foo) (
+				sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+				sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			  )
+			  /
+			  sum by(foo) (
+				sum by(foo, __cortex_shard__) (rate(foo{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+				sum by(foo, __cortex_shard__) (rate(foo{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			  )
+			)`,
+		},
+		// This nested sum example is nonsensical, but equivalent.
+		{
+			shards: 2,
+			input:  `sum(sum by(foo) (rate(bar1{baz="blip"}[1m])))`,
+			expected: `sum without(__cortex_shard__) (
+			  sum by(__cortex_shard__) (
+				sum by(foo) (
+				  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+				  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+				)
+			  ) or
+			  sum by(__cortex_shard__)(
+				sum by(foo) (
+				  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+				  sum by(foo, __cortex_shard__) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+				)
+			  )
+			)`,
+		},
+		// without
+		{
+			shards: 2,
+			input:  `sum without(foo) (rate(bar1{baz="blip"}[1m]))`,
+			expected: `sum without(__cortex_shard__) (
+			  sum without(foo) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+			  sum without(foo) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			)`,
+		},
+		// multiple dimensions
+		{
+			shards: 2,
+			input:  `sum by(foo, bom) (rate(bar1{baz="blip"}[1m]))`,
+			expected: `sum by(foo, bom) (
+			  sum by(foo, bom, __cortex_shard__) (rate(bar1{__cortex_shard__="0_of_2",baz="blip"}[1m])) or
+			  sum by(foo, bom, __cortex_shard__) (rate(bar1{__cortex_shard__="1_of_2",baz="blip"}[1m]))
+			)`,
+		},
+		// sharding histogram inputs
+		{
+			shards: 2,
+			input:  `histogram_quantile(0.9, sum(rate(alertmanager_http_request_duration_seconds_bucket[10m])) by (job, le))`,
+			expected: `histogram_quantile(
+				    0.9,
+				    sum by(job, le) (
+				      sum by(job, le, __cortex_shard__) (rate(alertmanager_http_request_duration_seconds_bucket{__cortex_shard__="0_of_2"}[10m])) or
+				      sum by(job, le, __cortex_shard__) (rate(alertmanager_http_request_duration_seconds_bucket{__cortex_shard__="1_of_2"}[10m]))
+				    )
+				  )`,
+		},
+	}
+
+	for i, c := range testExpr {
+		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
+
+			summer, err := NewShardSummer(c.shards, OrSquasher)
+			require.Nil(t, err)
+			expr, err := promql.ParseExpr(c.input)
+			require.Nil(t, err)
+			res, err := summer.Map(expr)
+			require.Nil(t, err)
+
+			expected, err := promql.ParseExpr(c.expected)
+			require.Nil(t, err)
+
+			require.Equal(t, expected.String(), res.String())
+		})
+	}
+}
+
+func TestShardSummerWithEncoding(t *testing.T) {
+	for i, c := range []struct {
+		shards   int
+		input    string
+		expected string
+	}{
+		{
+			shards:   3,
+			input:    `sum(rate(bar1{baz="blip"}[1m]))`,
+			expected: `sum without(__cortex_shard__) (__embedded_queries__{__cortex_queries__="{\"Concat\":[\"sum by(__cortex_shard__) (rate(bar1{__cortex_shard__=\\\"0_of_3\\\",baz=\\\"blip\\\"}[1m]))\",\"sum by(__cortex_shard__) (rate(bar1{__cortex_shard__=\\\"1_of_3\\\",baz=\\\"blip\\\"}[1m]))\",\"sum by(__cortex_shard__) (rate(bar1{__cortex_shard__=\\\"2_of_3\\\",baz=\\\"blip\\\"}[1m]))\"]}"})`,
+		},
+	} {
+		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
+			summer, err := NewShardSummer(c.shards, VectorSquasher)
+			require.Nil(t, err)
+			expr, err := promql.ParseExpr(c.input)
+			require.Nil(t, err)
+			res, err := summer.Map(expr)
+			require.Nil(t, err)
+
+			expected, err := promql.ParseExpr(c.expected)
+			require.Nil(t, err)
+
+			require.Equal(t, expected.String(), res.String())
+		})
+	}
+}
+
+func TestParseShard(t *testing.T) {
+	var testExpr = []struct {
+		input  string
+		output ShardAnnotation
+		err    bool
+	}{
+		{
+			input:  "lsdjf",
+			output: ShardAnnotation{},
+			err:    true,
+		},
+		{
+			input:  "a_of_3",
+			output: ShardAnnotation{},
+			err:    true,
+		},
+		{
+			input:  "3_of_3",
+			output: ShardAnnotation{},
+			err:    true,
+		},
+		{
+			input: "1_of_2",
+			output: ShardAnnotation{
+				Shard: 1,
+				Of:    2,
+			},
+		},
+	}
+
+	for _, c := range testExpr {
+		t.Run(fmt.Sprint(c.input), func(t *testing.T) {
+			shard, err := ParseShard(c.input)
+			if c.err {
+				require.NotNil(t, err)
+			} else {
+				require.Nil(t, err)
+				require.Equal(t, c.output, shard)
+			}
+		})
+	}
+
+}
+
+func TestShardFromMatchers(t *testing.T) {
+	var testExpr = []struct {
+		input []*labels.Matcher
+		shard *ShardAnnotation
+		idx   int
+		err   bool
+	}{
+		{
+			input: []*labels.Matcher{
+				{},
+				{
+					Name: ShardLabel,
+					Type: labels.MatchEqual,
+					Value: ShardAnnotation{
+						Shard: 10,
+						Of:    16,
+					}.String(),
+				},
+				{},
+			},
+			shard: &ShardAnnotation{
+				Shard: 10,
+				Of:    16,
+			},
+			idx: 1,
+			err: false,
+		},
+		{
+			input: []*labels.Matcher{
+				{
+					Name:  ShardLabel,
+					Type:  labels.MatchEqual,
+					Value: "invalid-fmt",
+				},
+			},
+			shard: nil,
+			idx:   0,
+			err:   true,
+		},
+		{
+			input: []*labels.Matcher{},
+			shard: nil,
+			idx:   0,
+			err:   false,
+		},
+	}
+
+	for i, c := range testExpr {
+		t.Run(fmt.Sprint(i), func(t *testing.T) {
+			shard, idx, err := ShardFromMatchers(c.input)
+			if c.err {
+				require.NotNil(t, err)
+			} else {
+				require.Nil(t, err)
+				require.Equal(t, c.shard, shard)
+				require.Equal(t, c.idx, idx)
+			}
+		})
+	}
+
+}
diff --git a/pkg/querier/astmapper/subtree_folder.go b/pkg/querier/astmapper/subtree_folder.go
new file mode 100644
index 00000000000..3f206cdd331
--- /dev/null
+++ b/pkg/querier/astmapper/subtree_folder.go
@@ -0,0 +1,102 @@
+package astmapper
+
+import (
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/promql"
+)
+
+/*
+subtreeFolder is a NodeMapper which folds an entire promql.Node subtree into a single
+embedded query, provided the subtree does not already contain an embedded query.
+This allows the frontend to "zip up" entire subtrees of an AST that have not already
+been parallelized. Number and string literal leaves are never folded (see MapNode).
+*/
+type subtreeFolder struct {
+	codec Codec // set by NewSubtreeFolder; MapNode in this file does not read it
+}
+
+// NewSubtreeFolder creates a subtreeFolder, wrapped as an ASTMapper, with a specified codec.
+// It returns an error if codec is nil. The codec passed by the caller is the one stored
+// on the folder, rather than a fixed package-level default.
+func NewSubtreeFolder(codec Codec) (ASTMapper, error) {
+	if codec == nil {
+		return nil, errors.New("nil codec")
+	}
+	return NewASTNodeMapper(&subtreeFolder{codec: codec}), nil
+}
+
+// MapNode impls NodeMapper: a subtree containing no embedded query is squashed into one via VectorSquasher.
+func (f *subtreeFolder) MapNode(node promql.Node) (promql.Node, bool, error) {
+	// number and string literal leaves are handed back unfolded
+	switch node.(type) {
+	case *promql.NumberLiteral, *promql.StringLiteral:
+		return node, true, nil
+	}
+
+	// a subtree that already holds an embedded query is returned as-is with a false flag
+	hasEmbedded, err := Predicate(node, isEmbedded)
+	if err != nil {
+		return nil, true, err
+	}
+	if hasEmbedded {
+		return node, false, nil
+	}
+
+	squashed, err := VectorSquasher(node)
+	return squashed, true, err
+}
+
+// isEmbedded is a predicate reporting whether node is a vector or matrix selector
+// whose Name equals EmbeddedQueryFlag. Its error result is always nil.
+func isEmbedded(node promql.Node) (bool, error) {
+	switch sel := node.(type) {
+	case *promql.VectorSelector:
+		// instant-vector selector: embedded iff it carries the flag name
+		return sel.Name == EmbeddedQueryFlag, nil
+	case *promql.MatrixSelector:
+		// range-vector selector: same name check
+		return sel.Name == EmbeddedQueryFlag, nil
+	default:
+		// no other node kind is treated as an embedded query
+		return false, nil
+	}
+}
+
+// predicate is the signature of a per-node test applied while walking an AST.
+type predicate = func(promql.Node) (bool, error)
+
+// Predicate is a helper which uses promql.Walk under the hood to determine whether fn
+// returns true for any node in the subtree rooted at node. A walk error is returned with false.
+func Predicate(node promql.Node, fn predicate) (bool, error) {
+	walker := &visitor{fn: fn}
+
+	err := promql.Walk(walker, node, nil)
+	if err != nil {
+		return false, err
+	}
+	return walker.result, nil
+}
+
+// visitor records in result whether fn has returned true for a node it was shown.
+type visitor struct {
+	fn     predicate
+	result bool
+}
+
+// Visit impls promql.Visitor. It returns a nil visitor once a match is recorded or fn errors, else itself.
+func (v *visitor) Visit(node promql.Node, path []promql.Node) (promql.Visitor, error) {
+	// a match was already recorded: keep it rather than re-evaluating fn
+	if v.result {
+		return nil, nil
+	}
+
+	matched, err := v.fn(node)
+	v.result = matched
+	switch {
+	case err != nil:
+		return nil, err
+	case matched:
+		return nil, nil
+	}
+	return v, nil
+}
diff --git a/pkg/querier/astmapper/subtree_folder_test.go b/pkg/querier/astmapper/subtree_folder_test.go
new file mode 100644
index 00000000000..0a22619d34c
--- /dev/null
+++ b/pkg/querier/astmapper/subtree_folder_test.go
@@ -0,0 +1,114 @@
+package astmapper
+
+import (
+	"fmt"
+	"testing"
+
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/stretchr/testify/require"
+)
+
+// TestPredicate runs Predicate over parsed queries with erroring, always-false, always-true and isEmbedded predicates.
+func TestPredicate(t *testing.T) {
+	for i, tc := range []struct {
+		input    string
+		fn       predicate
+		expected bool
+		err      bool
+	}{
+		{
+			input: "selector1{} or selector2{}",
+			fn: func(_ promql.Node) (bool, error) {
+				return false, errors.New("some err")
+			},
+			expected: false,
+			err:      true,
+		},
+		{
+			input: "selector1{} or selector2{}",
+			fn: func(_ promql.Node) (bool, error) {
+				return false, nil
+			},
+			expected: false,
+			err:      false,
+		},
+		{
+			input: "selector1{} or selector2{}",
+			fn: func(_ promql.Node) (bool, error) {
+				return true, nil
+			},
+			expected: true,
+			err:      false,
+		},
+		{
+			input:    `sum without(__cortex_shard__) (__embedded_queries__{__cortex_queries__="tstquery"}) or sum(selector)`,
+			fn:       isEmbedded,
+			expected: true,
+			err:      false,
+		},
+	} {
+		t.Run(fmt.Sprintf("%d", i), func(t *testing.T) {
+			parsed, err := promql.ParseExpr(tc.input)
+			require.Nil(t, err)
+
+			got, err := Predicate(parsed.(promql.Node), tc.fn)
+			if tc.err {
+				require.Error(t, err)
+			} else {
+				require.Nil(t, err)
+			}
+			require.Equal(t, tc.expected, got)
+		})
+	}
+}
+
+// TestSubtreeMapper maps each input through a subtree folder and compares the printed result with the expected query.
+func TestSubtreeMapper(t *testing.T) {
+	for i, tc := range []struct {
+		input    string
+		expected string
+	}{
+		// a whole histogram_quantile expression is folded into one embedded query
+		{
+			input:    "histogram_quantile(0.5, rate(alertmanager_http_request_duration_seconds_bucket[1m]))",
+			expected: `__embedded_queries__{__cortex_queries__="{\"Concat\":[\"histogram_quantile(0.5, rate(alertmanager_http_request_duration_seconds_bucket[1m]))\"]}"}`,
+		},
+		// a binary expression across two functions is folded as a single unit
+		{
+			input:    `rate(http_requests_total{cluster="eu-west2"}[5m]) or rate(http_requests_total{cluster="us-central1"}[5m])`,
+			expected: `__embedded_queries__{__cortex_queries__="{\"Concat\":[\"rate(http_requests_total{cluster=\\\"eu-west2\\\"}[5m]) or rate(http_requests_total{cluster=\\\"us-central1\\\"}[5m])\"]}"}`,
+		},
+
+		// the left leg (histogram) has not been embedded at any level, so it is folded;
+		// the right leg is already embedded and must be left alone.
+		{
+			input: `sum(histogram_quantile(0.5, rate(selector[1m]))) +
+				sum without(__cortex_shard__) (__embedded_queries__{__cortex_queries__="tstquery"})`,
+			expected: `
+			  __embedded_queries__{__cortex_queries__="{\"Concat\":[\"sum(histogram_quantile(0.5, rate(selector[1m])))\"]}"} +
+			  sum without(__cortex_shard__) (__embedded_queries__{__cortex_queries__="tstquery"})
+`,
+		},
+		// the scalar argument is not embedded and the already-embedded selector is kept
+		{
+			input:    `histogram_quantile(0.5, __embedded_queries__{__cortex_queries__="tstquery"})`,
+			expected: `histogram_quantile(0.5, __embedded_queries__{__cortex_queries__="tstquery"})`,
+		},
+	} {
+		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
+			folder, err := NewSubtreeFolder(JSONCodec)
+			require.Nil(t, err)
+
+			parsed, err := promql.ParseExpr(tc.input)
+			require.Nil(t, err)
+			got, err := folder.Map(parsed)
+			require.Nil(t, err)
+
+			want, err := promql.ParseExpr(tc.expected)
+			require.Nil(t, err)
+
+			require.Equal(t, want.String(), got.String())
+		})
+	}
+}
diff --git a/pkg/querier/chunk_store_queryable.go b/pkg/querier/chunk_store_queryable.go
index 65f0acca46c..853ea7cecda 100644
--- a/pkg/querier/chunk_store_queryable.go
+++ b/pkg/querier/chunk_store_queryable.go
@@ -12,11 +12,13 @@ import (
 	"github.com/cortexproject/cortex/pkg/ingester/client"
 
 	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
+	seriesset "github.com/cortexproject/cortex/pkg/querier/series"
 )
 
 type chunkIteratorFunc func(chunks []chunk.Chunk, from, through model.Time) storage.SeriesIterator
 
-func newChunkStoreQueryable(store ChunkStore, chunkIteratorFunc chunkIteratorFunc) storage.Queryable {
+func newChunkStoreQueryable(store chunkstore.ChunkStore, chunkIteratorFunc chunkIteratorFunc) storage.Queryable {
 	return storage.QueryableFunc(func(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
 		return &chunkStoreQuerier{
 			store:             store,
@@ -29,7 +31,7 @@ func newChunkStoreQueryable(store ChunkStore, chunkIteratorFunc chunkIteratorFun
 }
 
 type chunkStoreQuerier struct {
-	store             ChunkStore
+	store             chunkstore.ChunkStore
 	chunkIteratorFunc chunkIteratorFunc
 	ctx               context.Context
 	mint, maxt        int64
@@ -66,7 +68,7 @@ func (q *chunkStoreQuerier) partitionChunks(chunks []chunk.Chunk) storage.Series
 		})
 	}
 
-	return newConcreteSeriesSet(series)
+	return seriesset.NewConcreteSeriesSet(series)
 }
 
 func (q *chunkStoreQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
diff --git a/pkg/querier/chunk_tar_test.go b/pkg/querier/chunk_tar_test.go
index 245c0cf5f26..275cb1e36a2 100644
--- a/pkg/querier/chunk_tar_test.go
+++ b/pkg/querier/chunk_tar_test.go
@@ -11,6 +11,10 @@ import (
 	"testing"
 	"time"
 
+	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/querier/batch"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
+	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/stretchr/testify/require"
@@ -21,7 +25,7 @@ import (
 	"github.com/cortexproject/cortex/pkg/util"
 )
 
-func getTarDataFromEnv(t testing.TB) (query string, from, through time.Time, step time.Duration, store ChunkStore) {
+func getTarDataFromEnv(t testing.TB) (query string, from, through time.Time, step time.Duration, store chunkstore.ChunkStore) {
 	var (
 		err            error
 		chunksFilename = os.Getenv("CHUNKS")
@@ -48,7 +52,7 @@ func getTarDataFromEnv(t testing.TB) (query string, from, through time.Time, ste
 	return query, from, through, step, &mockChunkStore{chunks}
 }
 
-func runRangeQuery(t testing.TB, query string, from, through time.Time, step time.Duration, store ChunkStore) {
+func runRangeQuery(t testing.TB, query string, from, through time.Time, step time.Duration, store chunkstore.ChunkStore) {
 	if len(query) == 0 || store == nil {
 		return
 	}
diff --git a/pkg/querier/chunks_handler.go b/pkg/querier/chunks_handler.go
index d91ed8eb58c..ea694ae12b0 100644
--- a/pkg/querier/chunks_handler.go
+++ b/pkg/querier/chunks_handler.go
@@ -10,6 +10,7 @@ import (
 	"github.com/prometheus/prometheus/storage"
 	"github.com/weaveworks/common/user"
 
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 	"github.com/cortexproject/cortex/pkg/querier/queryrange"
 )
 
@@ -48,7 +49,7 @@ func ChunksHandler(queryable storage.Queryable) http.Handler {
 			return
 		}
 
-		store, ok := querier.(ChunkStore)
+		store, ok := querier.(chunkstore.ChunkStore)
 		if !ok {
 			http.Error(w, "not supported", http.StatusServiceUnavailable)
 			return
diff --git a/pkg/querier/chunkstore/chunkstore.go b/pkg/querier/chunkstore/chunkstore.go
new file mode 100644
index 00000000000..3b1045ef0d6
--- /dev/null
+++ b/pkg/querier/chunkstore/chunkstore.go
@@ -0,0 +1,15 @@
+package chunkstore
+
+import (
+	"context"
+
+	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/prometheus/common/model"
+	"github.com/prometheus/prometheus/pkg/labels"
+)
+
+// ChunkStore is the read-interface to the Chunk Store: Get takes a user ID, a time range and
+// label matchers and returns chunks. Made an interface here to reduce package coupling.
+type ChunkStore interface {
+	Get(ctx context.Context, userID string, from, through model.Time, matchers ...*labels.Matcher) ([]chunk.Chunk, error)
+}
diff --git a/pkg/querier/distributor_queryable.go b/pkg/querier/distributor_queryable.go
index c52d67b05be..b941cf5eb4f 100644
--- a/pkg/querier/distributor_queryable.go
+++ b/pkg/querier/distributor_queryable.go
@@ -10,6 +10,7 @@ import (
 
 	"github.com/cortexproject/cortex/pkg/ingester/client"
 	"github.com/cortexproject/cortex/pkg/prom1/storage/metric"
+	"github.com/cortexproject/cortex/pkg/querier/series"
 )
 
 // Distributor is the read interface to the distributor, made an interface here
@@ -51,7 +52,7 @@ func (q *distributorQuerier) Select(sp *storage.SelectParams, matchers ...*label
 		return nil, nil, promql.ErrStorage{Err: err}
 	}
 
-	return matrixToSeriesSet(matrix), nil, nil
+	return series.MatrixToSeriesSet(matrix), nil, nil
 }
 
 func (q *distributorQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
diff --git a/pkg/querier/ingester_streaming_queryable.go b/pkg/querier/ingester_streaming_queryable.go
index 08b18f9ec9f..78263e5025a 100644
--- a/pkg/querier/ingester_streaming_queryable.go
+++ b/pkg/querier/ingester_streaming_queryable.go
@@ -13,6 +13,7 @@ import (
 
 	"github.com/cortexproject/cortex/pkg/chunk"
 	"github.com/cortexproject/cortex/pkg/ingester/client"
+	seriesset "github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/cortexproject/cortex/pkg/util/chunkcompat"
 )
 
@@ -110,5 +111,5 @@ func (q *ingesterStreamingQuerier) Select(sp *storage.SelectParams, matchers ...
 		serieses = append(serieses, series)
 	}
 
-	return newConcreteSeriesSet(serieses), nil, nil
+	return seriesset.NewConcreteSeriesSet(serieses), nil, nil
 }
diff --git a/pkg/querier/lazy_querier.go b/pkg/querier/lazyquery/lazyquery.go
similarity index 61%
rename from pkg/querier/lazy_querier.go
rename to pkg/querier/lazyquery/lazyquery.go
index bbc667d4072..ba8a43ceaf2 100644
--- a/pkg/querier/lazy_querier.go
+++ b/pkg/querier/lazyquery/lazyquery.go
@@ -1,9 +1,11 @@
-package querier
+package lazyquery
 
 import (
 	"context"
 	"fmt"
 
+	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/storage"
@@ -11,16 +13,38 @@ import (
 	"github.com/cortexproject/cortex/pkg/chunk"
 )
 
-type lazyQuerier struct {
+// LazyQueryable wraps a storage.Queryable and hands out queriers wrapped by NewLazyQuerier.
+type LazyQueryable struct {
+	q storage.Queryable
+}
+
+// Querier impls storage.Queryable: it asks the wrapped queryable for a querier and wraps
+// the result with NewLazyQuerier; an error from the wrapped queryable is returned as-is.
+func (lq LazyQueryable) Querier(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
+	inner, err := lq.q.Querier(ctx, mint, maxt)
+	if err != nil {
+		return nil, err
+	}
+	return NewLazyQuerier(inner), nil
+}
+
+// NewLazyQueryable returns q wrapped in a LazyQueryable.
+func NewLazyQueryable(q storage.Queryable) storage.Queryable {
+	return LazyQueryable{q: q}
+}
+
+// LazyQuerier is a lazy-loaded adapter for a storage.Querier
+type LazyQuerier struct {
 	next storage.Querier
 }
 
-// newLazyQuerier wraps a storage.Querier, does the Select in the background.
+// NewLazyQuerier wraps a storage.Querier, does the Select in the background.
 // Return value cannot be used from more than one goroutine simultaneously.
-func newLazyQuerier(next storage.Querier) storage.Querier {
-	return lazyQuerier{next}
+func NewLazyQuerier(next storage.Querier) storage.Querier {
+	return LazyQuerier{next}
 }
 
+// Select implements storage.Querier.
 func (l lazyQuerier) Select(params *storage.SelectParams, matchers ...*labels.Matcher) (storage.SeriesSet, storage.Warnings, error) {
 	// make sure there is space in the buffer, to unblock the goroutine and let it die even if nobody is
 	// waiting for the result yet (or anymore).
@@ -38,21 +62,24 @@ func (l lazyQuerier) Select(params *storage.SelectParams, matchers ...*labels.Ma
 	}, nil, nil
 }
 
-func (l lazyQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
+// LabelValues implements storage.Querier.
+func (l LazyQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
 	return l.next.LabelValues(name)
 }
 
-func (l lazyQuerier) LabelNames() ([]string, storage.Warnings, error) {
+// LabelNames implements storage.Querier.
+func (l LazyQuerier) LabelNames() ([]string, storage.Warnings, error) {
 	return l.next.LabelNames()
 }
 
-func (l lazyQuerier) Close() error {
+// Close implements storage.Querier.
+func (l LazyQuerier) Close() error {
 	return l.next.Close()
 }
 
 // Get implements ChunkStore for the chunk tar HTTP handler.
-func (l lazyQuerier) Get(ctx context.Context, userID string, from, through model.Time, matchers ...*labels.Matcher) ([]chunk.Chunk, error) {
-	store, ok := l.next.(ChunkStore)
+func (l LazyQuerier) Get(ctx context.Context, userID string, from, through model.Time, matchers ...*labels.Matcher) ([]chunk.Chunk, error) {
+	store, ok := l.next.(chunkstore.ChunkStore)
 	if !ok {
 		return nil, fmt.Errorf("not supported")
 	}
diff --git a/pkg/querier/matrix.go b/pkg/querier/matrix.go
index c6bd9d0ec3f..8ac963ad5ac 100644
--- a/pkg/querier/matrix.go
+++ b/pkg/querier/matrix.go
@@ -5,6 +5,7 @@ import (
 	"github.com/prometheus/prometheus/storage"
 
 	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/cortexproject/cortex/pkg/util"
 )
 
@@ -13,12 +14,12 @@ func mergeChunks(chunks []chunk.Chunk, from, through model.Time) storage.SeriesI
 	for _, c := range chunks {
 		ss, err := c.Samples(from, through)
 		if err != nil {
-			return errIterator{err}
+			return series.NewErrIterator(err)
 		}
 
 		samples = append(samples, ss)
 	}
 
 	merged := util.MergeNSampleSets(samples...)
-	return newConcreteSeriesIterator(newConcreteSeries(nil, merged))
+	return series.NewConcreteSeriesIterator(series.NewConcreteSeries(nil, merged))
 }
diff --git a/pkg/querier/querier.go b/pkg/querier/querier.go
index 3a789873927..6b0984e918b 100644
--- a/pkg/querier/querier.go
+++ b/pkg/querier/querier.go
@@ -12,9 +12,11 @@ import (
 	"github.com/prometheus/prometheus/promql"
 	"github.com/prometheus/prometheus/storage"
 
-	"github.com/cortexproject/cortex/pkg/chunk"
 	"github.com/cortexproject/cortex/pkg/querier/batch"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 	"github.com/cortexproject/cortex/pkg/querier/iterators"
+	"github.com/cortexproject/cortex/pkg/querier/lazyquery"
+	seriesset "github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/cortexproject/cortex/pkg/util"
 )
 
@@ -74,14 +76,8 @@ func (cfg *Config) Validate() error {
 	return nil
 }
 
-// ChunkStore is the read-interface to the Chunk Store.  Made an interface here
-// to reduce package coupling.
-type ChunkStore interface {
-	Get(ctx context.Context, userID string, from, through model.Time, matchers ...*labels.Matcher) ([]chunk.Chunk, error)
-}
-
 // New builds a queryable and promql engine.
-func New(cfg Config, distributor Distributor, chunkStore ChunkStore) (storage.Queryable, *promql.Engine) {
+func New(cfg Config, distributor Distributor, chunkStore chunkstore.ChunkStore) (storage.Queryable, *promql.Engine) {
 	iteratorFunc := mergeChunks
 	if cfg.BatchIterators {
 		iteratorFunc = batch.NewChunkMergeIterator
@@ -104,7 +100,7 @@ func New(cfg Config, distributor Distributor, chunkStore ChunkStore) (storage.Qu
 		if err != nil {
 			return nil, err
 		}
-		return newLazyQuerier(querier), nil
+		return lazyquery.NewLazyQuerier(querier), nil
 	})
 
 	promql.SetDefaultEvaluationInterval(cfg.DefaultEvaluationInterval)
@@ -210,7 +206,7 @@ func (q querier) metadataQuery(matchers ...*labels.Matcher) (storage.SeriesSet,
 	if err != nil {
 		return nil, nil, err
 	}
-	return metricsToSeriesSet(ms), nil, nil
+	return seriesset.MetricsToSeriesSet(ms), nil, nil
 }
 
 func (querier) Close() error {
diff --git a/pkg/querier/queryrange/promql_test.go b/pkg/querier/queryrange/promql_test.go
new file mode 100644
index 00000000000..359d3922862
--- /dev/null
+++ b/pkg/querier/queryrange/promql_test.go
@@ -0,0 +1,612 @@
+package queryrange
+
+import (
+	"context"
+	"fmt"
+	"math"
+	"sort"
+	"strings"
+	"testing"
+	"time"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/cortexproject/cortex/pkg/util"
+	"github.com/prometheus/client_golang/prometheus"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/prometheus/prometheus/storage"
+	"github.com/stretchr/testify/require"
+)
+
+var (
+	start  = time.Unix(1000, 0)         // start time passed to every range query in these tests
+	end    = start.Add(3 * time.Minute) // end time passed to every range query
+	step   = 30 * time.Second           // step passed to every range query
+	ctx    = context.Background()       // context passed to Exec
+	engine = promql.NewEngine(promql.EngineOpts{
+		Reg:                prometheus.DefaultRegisterer,
+		MaxConcurrent:      1000,
+		Logger:             util.Logger,
+		Timeout:            1 * time.Hour,
+		MaxSamples:         10e6,
+		ActiveQueryTracker: nil,
+	})
+)
+
+// Test_PromQL verifies which PromQL expressions can be parallelized by comparing each query with a hand-sharded rewrite.
+func Test_PromQL(t *testing.T) {
+	t.Parallel()
+
+	var tests = []struct {
+		normalQuery string
+		shardQuery  string
+		shouldEqual bool
+	}{
+		// Vector can be parallelized but we need to remove the cortex shard label.
+		// It should be noted that the __cortex_shard__ label is required by the engine
+		// and therefore should be returned by the storage.
+		// Range vectors `bar1{baz="blip"}[1m]` are not tested here because they are not
+		// supported by range queries.
+		{
+			`bar1{baz="blip"}`,
+			`label_replace(
+				bar1{__cortex_shard__="0_of_3",baz="blip"} or
+				bar1{__cortex_shard__="1_of_3",baz="blip"} or
+				bar1{__cortex_shard__="2_of_3",baz="blip"},
+				"__cortex_shard__","","",""
+			)`,
+			true,
+		},
+		// __cortex_shard__ label is required otherwise the or will keep only the first series.
+		{
+			`sum(bar1{baz="blip"})`,
+			`sum(
+				sum (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				sum (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				sum (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			false,
+		},
+		{
+			`sum(bar1{baz="blip"})`,
+			`sum(
+				sum without(__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				sum without(__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				sum without(__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			true,
+		},
+		{
+			`sum by (foo) (bar1{baz="blip"})`,
+			`sum by (foo) (
+				sum by(foo,__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				sum by(foo,__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				sum by(foo,__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			true,
+		},
+		{
+			`sum by (foo,bar) (bar1{baz="blip"})`,
+			`sum by (foo,bar)(
+				sum by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				sum by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				sum by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			true,
+		},
+		// since series are unique to a shard, it's safe to sum without shard first, then reaggregate
+		{
+			`sum without (foo,bar) (bar1{baz="blip"})`,
+			`sum without (foo,bar)(
+				sum without(__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				sum without(__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				sum without(__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			true,
+		},
+		{
+			`min by (foo,bar) (bar1{baz="blip"})`,
+			`min by (foo,bar)(
+				min by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				min by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				min by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			true,
+		},
+		{
+			`max by (foo,bar) (bar1{baz="blip"})`,
+			` max by (foo,bar)(
+				max by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				max by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				max by(foo,bar,__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			true,
+		},
+		// avg generally can't be parallelized
+		{
+			`avg(bar1{baz="blip"})`,
+			`avg(
+				avg by(__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				avg by(__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				avg by(__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			false,
+		},
+		// stddev can't be parallelized.
+		{
+			`stddev(bar1{baz="blip"})`,
+			` stddev(
+				stddev by(__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				stddev by(__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				stddev by(__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			false,
+		},
+		// stdvar can't be parallelized.
+		{
+			`stdvar(bar1{baz="blip"})`,
+			`stdvar(
+				stdvar by(__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				stdvar by(__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				stdvar by(__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			  )`,
+			false,
+		},
+		{
+			`count(bar1{baz="blip"})`,
+			`count(
+				count without (__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				count without (__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				count without (__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+				)`,
+			true,
+		},
+		{
+			`count by (foo,bar) (bar1{baz="blip"})`,
+			`count by (foo,bar) (
+				count by (foo,bar,__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				count by (foo,bar,__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				count by (foo,bar,__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			)`,
+			true,
+		},
+		// different ways to represent count without.
+		{
+			`count without (foo) (bar1{baz="blip"})`,
+			`count without (foo) (
+				count without (__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				count without (__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				count without (__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			)`,
+			true,
+		},
+		{
+			`count without (foo) (bar1{baz="blip"})`,
+			`sum without (__cortex_shard__) (
+				count without (foo) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				count without (foo) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				count without (foo) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			)`,
+			true,
+		},
+		{
+			`count without (foo, bar) (bar1{baz="blip"})`,
+			`count without (foo, bar) (
+				count without (__cortex_shard__) (bar1{__cortex_shard__="0_of_3",baz="blip"}) or
+				count without (__cortex_shard__) (bar1{__cortex_shard__="1_of_3",baz="blip"}) or
+				count without (__cortex_shard__) (bar1{__cortex_shard__="2_of_3",baz="blip"})
+			)`,
+			true,
+		},
+		{
+			`topk(2,bar1{baz="blip"})`,
+			`label_replace(
+				topk(2,
+					topk(2,(bar1{__cortex_shard__="0_of_3",baz="blip"})) without(__cortex_shard__) or
+					topk(2,(bar1{__cortex_shard__="1_of_3",baz="blip"})) without(__cortex_shard__) or
+					topk(2,(bar1{__cortex_shard__="2_of_3",baz="blip"})) without(__cortex_shard__)
+				),
+                          "__cortex_shard__","","","")`,
+			true,
+		},
+		{
+			`bottomk(2,bar1{baz="blip"})`,
+			`label_replace(
+				bottomk(2,
+					bottomk(2,(bar1{__cortex_shard__="0_of_3",baz="blip"})) without(__cortex_shard__) or
+					bottomk(2,(bar1{__cortex_shard__="1_of_3",baz="blip"})) without(__cortex_shard__) or
+					bottomk(2,(bar1{__cortex_shard__="2_of_3",baz="blip"})) without(__cortex_shard__)
+				),
+                          "__cortex_shard__","","","")`,
+			true,
+		},
+		{
+			`sum by (foo,bar) (avg_over_time(bar1{baz="blip"}[1m]))`,
+			`sum by (foo,bar)(
+				sum by(foo,bar,__cortex_shard__) (avg_over_time(bar1{__cortex_shard__="0_of_3",baz="blip"}[1m])) or
+				sum by(foo,bar,__cortex_shard__) (avg_over_time(bar1{__cortex_shard__="1_of_3",baz="blip"}[1m])) or
+				sum by(foo,bar,__cortex_shard__) (avg_over_time(bar1{__cortex_shard__="2_of_3",baz="blip"}[1m]))
+			  )`,
+			true,
+		},
+		{
+			`sum by (foo,bar) (min_over_time(bar1{baz="blip"}[1m]))`,
+			`sum by (foo,bar)(
+				sum by(foo,bar,__cortex_shard__) (min_over_time(bar1{__cortex_shard__="0_of_3",baz="blip"}[1m])) or
+				sum by(foo,bar,__cortex_shard__) (min_over_time(bar1{__cortex_shard__="1_of_3",baz="blip"}[1m])) or
+				sum by(foo,bar,__cortex_shard__) (min_over_time(bar1{__cortex_shard__="2_of_3",baz="blip"}[1m]))
+			  )`,
+			true,
+		},
+	}
+
+	for _, tt := range tests {
+		tt := tt
+		t.Run(tt.normalQuery, func(t *testing.T) {
+			baseQuery, err := engine.NewRangeQuery(shardAwareQueryable, tt.normalQuery, start, end, step)
+			require.Nil(t, err)
+			shardQuery, err := engine.NewRangeQuery(shardAwareQueryable, tt.shardQuery, start, end, step)
+			require.Nil(t, err)
+			baseResult := baseQuery.Exec(ctx)
+			shardResult := shardQuery.Exec(ctx)
+			t.Logf("base: %v\n", baseResult)
+			t.Logf("shard: %v\n", shardResult)
+			require.Nil(t, baseResult.Err) // two identical evaluation errors would otherwise compare as equal results
+			require.Nil(t, shardResult.Err)
+			if tt.shouldEqual {
+				require.Equal(t, baseResult, shardResult)
+				return
+			}
+			require.NotEqual(t, baseResult, shardResult)
+		})
+	}
+}
+
+// Test_FunctionParallelism checks, per PromQL function, that sum(fn(...)) matches its three-shard rewrite (exactly, or to 6 decimals).
+func Test_FunctionParallelism(t *testing.T) {
+	tpl := `sum(<fn>(bar1{}<fArgs>))`
+	shardTpl := `sum(
+				sum without(__cortex_shard__) (<fn>(bar1{__cortex_shard__="0_of_3"}<fArgs>)) or
+				sum without(__cortex_shard__) (<fn>(bar1{__cortex_shard__="1_of_3"}<fArgs>)) or
+				sum without(__cortex_shard__) (<fn>(bar1{__cortex_shard__="2_of_3"}<fArgs>))
+			  )`
+
+	mkQuery := func(tpl, fn string, testMatrix bool, fArgs []string) (result string) {
+		result = strings.Replace(tpl, "<fn>", fn, -1)
+
+		if testMatrix {
+			// turn selectors into ranges
+			result = strings.Replace(result, "}<fArgs>", "}[1m]<fArgs>", -1)
+		}
+
+		if len(fArgs) > 0 {
+			args := "," + strings.Join(fArgs, ",")
+			result = strings.Replace(result, "<fArgs>", args, -1)
+		} else {
+			result = strings.Replace(result, "<fArgs>", "", -1)
+		}
+
+		return result
+	}
+
+	for _, tc := range []struct {
+		fn           string
+		fArgs        []string
+		isTestMatrix bool
+		approximate  bool
+	}{
+		{
+			fn: "abs",
+		},
+		{
+			fn: "absent",
+		},
+		{
+			fn:           "avg_over_time",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn: "ceil",
+		},
+		{
+			fn:           "changes",
+			isTestMatrix: true,
+		},
+		{
+			fn:           "count_over_time",
+			isTestMatrix: true,
+		},
+		{
+			fn: "days_in_month",
+		},
+		{
+			fn: "day_of_month",
+		},
+		{
+			fn: "day_of_week",
+		},
+		{
+			fn:           "delta",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn:           "deriv",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn:          "exp",
+			approximate: true,
+		},
+		{
+			fn: "floor",
+		},
+		{
+			fn: "hour",
+		},
+		{
+			fn:           "idelta",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn:           "increase",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn:           "irate",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn:          "ln",
+			approximate: true,
+		},
+		{
+			fn:          "log10",
+			approximate: true,
+		},
+		{
+			fn:          "log2",
+			approximate: true,
+		},
+		{
+			fn:           "max_over_time",
+			isTestMatrix: true,
+		},
+		{
+			fn:           "min_over_time",
+			isTestMatrix: true,
+		},
+		{
+			fn: "minute",
+		},
+		{
+			fn: "month",
+		},
+		{
+			fn:           "rate",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn:           "resets",
+			isTestMatrix: true,
+		},
+		{
+			fn: "sort",
+		},
+		{
+			fn: "sort_desc",
+		},
+		{
+			fn:          "sqrt",
+			approximate: true,
+		},
+		{
+			fn:           "stddev_over_time",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn:           "stdvar_over_time",
+			isTestMatrix: true,
+			approximate:  true,
+		},
+		{
+			fn:           "sum_over_time",
+			isTestMatrix: true,
+		},
+		{
+			fn: "timestamp",
+		},
+		{
+			fn: "year",
+		},
+		{
+			fn:    "clamp_max",
+			fArgs: []string{"5"},
+		},
+		{
+			fn:    "clamp_min",
+			fArgs: []string{"5"},
+		},
+		{
+			fn:           "predict_linear",
+			isTestMatrix: true,
+			approximate:  true,
+			fArgs:        []string{"1"},
+		},
+		{
+			fn:    "round",
+			fArgs: []string{"20"},
+		},
+		{
+			fn:           "holt_winters",
+			isTestMatrix: true,
+			fArgs:        []string{"0.5", "0.7"},
+			approximate:  true,
+		},
+	} {
+		t.Run(tc.fn, func(t *testing.T) {
+			baseQuery, err := engine.NewRangeQuery(
+				shardAwareQueryable,
+				mkQuery(tpl, tc.fn, tc.isTestMatrix, tc.fArgs),
+				start,
+				end,
+				step,
+			)
+			require.Nil(t, err)
+			shardQuery, err := engine.NewRangeQuery(
+				shardAwareQueryable,
+				mkQuery(shardTpl, tc.fn, tc.isTestMatrix, tc.fArgs),
+				start,
+				end,
+				step,
+			)
+			require.Nil(t, err)
+			baseResult := baseQuery.Exec(ctx)
+			shardResult := shardQuery.Exec(ctx)
+			t.Logf("base: %+v\n", baseResult)
+			t.Logf("shard: %+v\n", shardResult)
+			require.Nil(t, baseResult.Err) // a failed query must not reach the Matrix assertion or compare equal to another failure
+			require.Nil(t, shardResult.Err)
+			if !tc.approximate {
+				require.Equal(t, baseResult, shardResult)
+			} else {
+				// Some functions yield tiny differences when sharded due to combining floating point calculations.
+				baseSeries := baseResult.Value.(promql.Matrix)[0]
+				shardSeries := shardResult.Value.(promql.Matrix)[0]
+
+				require.Equal(t, len(baseSeries.Points), len(shardSeries.Points))
+				for i, basePt := range baseSeries.Points {
+					shardPt := shardSeries.Points[i]
+					require.Equal(t, basePt.T, shardPt.T)
+					require.Equal(
+						t,
+						math.Round(basePt.V*1e6)/1e6,
+						math.Round(shardPt.V*1e6)/1e6,
+					)
+				}
+			}
+		})
+	}
+}
+
+var shardAwareQueryable = storage.QueryableFunc(func(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
+	return &testMatrix{
+		series: []*promql.StorageSeries{
+			newSeries(labels.Labels{{Name: "__name__", Value: "bar1"}, {Name: "baz", Value: "blip"}, {Name: "bar", Value: "blop"}, {Name: "foo", Value: "barr"}}, factor(5)),
+			newSeries(labels.Labels{{Name: "__name__", Value: "bar1"}, {Name: "baz", Value: "blip"}, {Name: "bar", Value: "blop"}, {Name: "foo", Value: "bazz"}}, factor(7)),
+			newSeries(labels.Labels{{Name: "__name__", Value: "bar1"}, {Name: "baz", Value: "blip"}, {Name: "bar", Value: "blap"}, {Name: "foo", Value: "buzz"}}, factor(12)),
+			newSeries(labels.Labels{{Name: "__name__", Value: "bar1"}, {Name: "baz", Value: "blip"}, {Name: "bar", Value: "blap"}, {Name: "foo", Value: "bozz"}}, factor(11)),
+			newSeries(labels.Labels{{Name: "__name__", Value: "bar1"}, {Name: "baz", Value: "blip"}, {Name: "bar", Value: "blop"}, {Name: "foo", Value: "buzz"}}, factor(8)),
+			newSeries(labels.Labels{{Name: "__name__", Value: "bar1"}, {Name: "baz", Value: "blip"}, {Name: "bar", Value: "blap"}, {Name: "foo", Value: "bazz"}}, identity),
+		},
+	}, nil
+})
+
+type testMatrix struct {
+	series []*promql.StorageSeries
+}
+
+func (m *testMatrix) Copy() *testMatrix {
+	cpy := *m
+	return &cpy
+}
+
+func (m testMatrix) Next() bool { return len(m.series) != 0 }
+
+func (m *testMatrix) At() storage.Series {
+	res := m.series[0]
+	m.series = m.series[1:]
+	return res
+}
+
+func (m *testMatrix) Err() error { return nil }
+
+func (m *testMatrix) Select(selectParams *storage.SelectParams, matchers ...*labels.Matcher) (storage.SeriesSet, storage.Warnings, error) {
+	s, _, err := astmapper.ShardFromMatchers(matchers)
+	if err != nil {
+		return nil, nil, err
+	}
+
+	if s != nil {
+		return splitByShard(s.Shard, s.Of, m), nil, nil
+	}
+
+	return m.Copy(), nil, nil
+}
+
+func (m *testMatrix) LabelValues(name string) ([]string, storage.Warnings, error) {
+	return nil, nil, nil
+}
+func (m *testMatrix) LabelNames() ([]string, storage.Warnings, error) { return nil, nil, nil }
+func (m *testMatrix) Close() error                                    { return nil }
+
+func newSeries(metric labels.Labels, generator func(float64) float64) *promql.StorageSeries {
+	sort.Sort(metric)
+	var points []promql.Point
+
+	for ts := start.Add(-step); ts.Unix() <= end.Unix(); ts = ts.Add(step) {
+		t := ts.Unix() * 1e3
+		points = append(points, promql.Point{
+			T: t,
+			V: generator(float64(t)),
+		})
+	}
+
+	return promql.NewStorageSeries(promql.Series{
+		Metric: metric,
+		Points: points,
+	})
+}
+
+func identity(t float64) float64 {
+	return float64(t)
+}
+
+func factor(f float64) func(float64) float64 {
+	i := 0.
+	return func(float64) float64 {
+		i++
+		res := i * f
+		return res
+	}
+}
+
+// var identity(t int64) float64 {
+// 	return float64(t)
+// }
+
+// splitByShard returns the subset of testMatrices that belongs to shard shardIndex out of shardTotal.
+// Series are assigned by position (index % shardTotal), e.g. 6 series over 3 shards gives 2 series
+// per shard. Each returned series is a copy that additionally carries a __cortex_shard__ label.
+func splitByShard(shardIndex, shardTotal int, testMatrices *testMatrix) *testMatrix {
+	res := &testMatrix{}
+	for i, s := range testMatrices.series {
+		if i%shardTotal != shardIndex {
+			continue
+		}
+		var points []promql.Point
+		it := s.Iterator()
+		for it.Next() {
+			t, v := it.At()
+			points = append(points, promql.Point{
+				T: t,
+				V: v,
+			})
+		}
+		// label the copy with the shard it was assigned to, formatted as "<index>_of_<total>"
+		lbs := s.Labels().Copy()
+		lbs = append(lbs, labels.Label{Name: "__cortex_shard__", Value: fmt.Sprintf("%d_of_%d", shardIndex, shardTotal)})
+		res.series = append(res.series, promql.NewStorageSeries(promql.Series{
+			Metric: lbs,
+			Points: points,
+		}))
+	}
+	return res
+}
diff --git a/pkg/querier/queryrange/query_range.go b/pkg/querier/queryrange/query_range.go
index bac9d1d7540..65c206b82cc 100644
--- a/pkg/querier/queryrange/query_range.go
+++ b/pkg/querier/queryrange/query_range.go
@@ -22,7 +22,8 @@ import (
 	"github.com/cortexproject/cortex/pkg/ingester/client"
 )
 
-const statusSuccess = "success"
+// StatusSuccess is the status string carried by a successful Prometheus response.
+const StatusSuccess = "success"
 
 var (
 	matrix            = model.ValMatrix.String()
@@ -71,6 +72,8 @@ type Request interface {
 	GetQuery() string
 	// WithStartEnd clone the current request with different start and end timestamp.
 	WithStartEnd(int64, int64) Request
+	// WithQuery clone the current request with a different query.
+	WithQuery(string) Request
 	proto.Message
 }
 
@@ -100,6 +103,13 @@ func (q *PrometheusRequest) WithStartEnd(start int64, end int64) Request {
 	return &new
 }
 
+// WithQuery clones the current `PrometheusRequest` with a new query.
+func (q *PrometheusRequest) WithQuery(query string) Request {
+	new := *q
+	new.Query = query
+	return &new
+}
+
 type byFirstTime []*PrometheusResponse
 
 func (a byFirstTime) Len() int           { return len(a) }
@@ -127,12 +137,12 @@ func (prometheusCodec) MergeResponse(responses ...Response) (Response, error) {
 
 	if len(promResponses) == 0 {
 		return &PrometheusResponse{
-			Status: statusSuccess,
+			Status: StatusSuccess,
 		}, nil
 	}
 
 	return &PrometheusResponse{
-		Status: statusSuccess,
+		Status: StatusSuccess,
 		Data: PrometheusData{
 			ResultType: model.ValMatrix.String(),
 			Result:     matrixMerge(promResponses),
diff --git a/pkg/querier/queryrange/query_range_test.go b/pkg/querier/queryrange/query_range_test.go
index 7bfd0c1ed94..2e25bcdca30 100644
--- a/pkg/querier/queryrange/query_range_test.go
+++ b/pkg/querier/queryrange/query_range_test.go
@@ -117,7 +117,7 @@ func TestMergeAPIResponses(t *testing.T) {
 		{
 			input: []Response{},
 			expected: &PrometheusResponse{
-				Status: statusSuccess,
+				Status: StatusSuccess,
 			},
 		},
 
@@ -132,7 +132,7 @@ func TestMergeAPIResponses(t *testing.T) {
 				},
 			},
 			expected: &PrometheusResponse{
-				Status: statusSuccess,
+				Status: StatusSuccess,
 				Data: PrometheusData{
 					ResultType: matrix,
 					Result:     []SampleStream{},
@@ -157,7 +157,7 @@ func TestMergeAPIResponses(t *testing.T) {
 				},
 			},
 			expected: &PrometheusResponse{
-				Status: statusSuccess,
+				Status: StatusSuccess,
 				Data: PrometheusData{
 					ResultType: matrix,
 					Result:     []SampleStream{},
@@ -198,7 +198,7 @@ func TestMergeAPIResponses(t *testing.T) {
 				},
 			},
 			expected: &PrometheusResponse{
-				Status: statusSuccess,
+				Status: StatusSuccess,
 				Data: PrometheusData{
 					ResultType: matrix,
 					Result: []SampleStream{
@@ -223,7 +223,7 @@ func TestMergeAPIResponses(t *testing.T) {
 				mustParse(t, `{"status":"success","data":{"resultType":"matrix","result":[{"metric":{"c":"d","a":"b"},"values":[[2,"2"],[3,"3"]]}]}}`),
 			},
 			expected: &PrometheusResponse{
-				Status: statusSuccess,
+				Status: StatusSuccess,
 				Data: PrometheusData{
 					ResultType: matrix,
 					Result: []SampleStream{
@@ -247,7 +247,7 @@ func TestMergeAPIResponses(t *testing.T) {
 				mustParse(t, `{"status":"success","data":{"resultType":"matrix","result":[{"metric":{"c":"d","a":"b"},"values":[[2,"2"],[3,"3"]]}]}}`),
 			},
 			expected: &PrometheusResponse{
-				Status: statusSuccess,
+				Status: StatusSuccess,
 				Data: PrometheusData{
 					ResultType: matrix,
 					Result: []SampleStream{
diff --git a/pkg/querier/queryrange/queryable.go b/pkg/querier/queryrange/queryable.go
new file mode 100644
index 00000000000..14a2ed7b073
--- /dev/null
+++ b/pkg/querier/queryrange/queryable.go
@@ -0,0 +1,120 @@
+package queryrange
+
+import (
+	"context"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/storage"
+)
+
+const (
+	missingEmbeddedQueryMsg = "missing embedded query"
+	nonEmbeddedErrMsg       = "DownstreamQuerier cannot handle a non-embedded query"
+)
+
+// DownstreamQueryable is an implementor of the Queryable interface.
+type DownstreamQueryable struct {
+	Req     Request
+	Handler Handler
+}
+
+// Querier returns a DownstreamQuerier bound to ctx, q.Req and q.Handler; mint and maxt are ignored.
+func (q *DownstreamQueryable) Querier(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
+	return &DownstreamQuerier{ctx, q.Req, q.Handler}, nil
+}
+
+// DownstreamQuerier is an implementor of the Querier interface.
+type DownstreamQuerier struct {
+	Ctx     context.Context // parent context for the downstream Handler calls
+	Req     Request         // template request, cloned with each embedded query
+	Handler Handler         // executes the per-query requests
+}
+
+// Select runs the query embedded in the matchers against the downstream Handler.
+// Matchers that do not flag an embedded query, or flag one without a payload, are rejected.
+func (q *DownstreamQuerier) Select(
+	_ *storage.SelectParams,
+	matchers ...*labels.Matcher,
+) (storage.SeriesSet, storage.Warnings, error) {
+	var (
+		encoded  string
+		embedded bool
+	)
+	for _, m := range matchers {
+		if m.Name == labels.MetricName && m.Value == astmapper.EmbeddedQueryFlag {
+			embedded = true
+		}
+		if m.Name == astmapper.QueryLabel {
+			encoded = m.Value
+		}
+	}
+
+	switch {
+	case !embedded:
+		return nil, nil, errors.Errorf(nonEmbeddedErrMsg)
+	case encoded == "":
+		return nil, nil, errors.Errorf(missingEmbeddedQueryMsg)
+	}
+	return q.handleEmbeddedQuery(encoded)
+}
+
+// handleEmbeddedQuery decodes the embedded queries, runs each of them concurrently against the downstream
+// Handler and concatenates the returned sample streams. The first error (or context cancellation) aborts it.
+func (q *DownstreamQuerier) handleEmbeddedQuery(encoded string) (storage.SeriesSet, storage.Warnings, error) {
+	queries, err := astmapper.JSONCodec.Decode(encoded)
+	if err != nil {
+		return nil, nil, err
+	}
+
+	ctx, cancel := context.WithCancel(q.Ctx)
+	defer cancel()
+	// buffer channels to length of queries to prevent leaking memory due to sending to unbuffered channels after cancel/err
+	errCh := make(chan error, len(queries))
+	samplesCh := make(chan []SampleStream, len(queries))
+	// TODO(owen-d): impl unified concurrency controls, not per middleware
+	for _, query := range queries {
+		go func(query string) {
+			resp, err := q.Handler.Do(ctx, q.Req.WithQuery(query))
+			if err != nil {
+				errCh <- err
+				return
+			}
+			streams, err := ResponseToSamples(resp)
+			if err != nil {
+				errCh <- err
+				return
+			}
+			samplesCh <- streams
+		}(query)
+	}
+
+	var samples []SampleStream
+	for range queries {
+		select {
+		case err := <-errCh:
+			return nil, nil, err
+		case streams := <-samplesCh:
+			samples = append(samples, streams...)
+		case <-ctx.Done():
+			return nil, nil, ctx.Err()
+		}
+	}
+	return NewSeriesSet(samples), nil, nil
+}
+
+// LabelValues is not supported by DownstreamQuerier; it always returns an "unimplemented" error.
+func (q *DownstreamQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
+	return nil, nil, errors.Errorf("unimplemented")
+}
+
+// LabelNames is not supported by DownstreamQuerier; it always returns an "unimplemented" error.
+func (q *DownstreamQuerier) LabelNames() ([]string, storage.Warnings, error) {
+	return nil, nil, errors.Errorf("unimplemented")
+}
+
+// Close is a no-op and always returns nil.
+func (q *DownstreamQuerier) Close() error {
+	return nil
+}
diff --git a/pkg/querier/queryrange/queryable_test.go b/pkg/querier/queryrange/queryable_test.go
new file mode 100644
index 00000000000..d056bc37dca
--- /dev/null
+++ b/pkg/querier/queryrange/queryable_test.go
@@ -0,0 +1,260 @@
+package queryrange
+
+import (
+	"context"
+	"testing"
+
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/stretchr/testify/require"
+)
+
+func TestSelect(t *testing.T) {
+	var testExpr = []struct {
+		name    string
+		querier *DownstreamQuerier
+		fn      func(*testing.T, *DownstreamQuerier)
+	}{
+		{
+			name: "errors non embedded query",
+			querier: mkQuerier(
+				nil,
+			),
+			fn: func(t *testing.T, q *DownstreamQuerier) {
+				set, _, err := q.Select(nil)
+				require.Nil(t, set)
+				require.EqualError(t, err, nonEmbeddedErrMsg)
+			},
+		},
+		{
+			name: "replaces query",
+			querier: mkQuerier(mockHandler(
+				&PrometheusResponse{},
+				nil,
+			)),
+			fn: func(t *testing.T, q *DownstreamQuerier) {
+
+				expected := &PrometheusResponse{
+					Status: "success",
+					Data: PrometheusData{
+						ResultType: promql.ValueTypeVector,
+					},
+				}
+
+				// override handler func to assert new query has been substituted
+				q.Handler = HandlerFunc(
+					func(ctx context.Context, req Request) (Response, error) {
+						require.Equal(t, `http_requests_total{cluster="prod"}`, req.GetQuery())
+						return expected, nil
+					},
+				)
+
+				_, _, err := q.Select(
+					nil,
+					exactMatch("__name__", astmapper.EmbeddedQueryFlag),
+					exactMatch(astmapper.QueryLabel, astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})),
+				)
+				require.Nil(t, err)
+			},
+		},
+		{
+			name: "propagates response error",
+			querier: mkQuerier(mockHandler(
+				&PrometheusResponse{
+					Error: "SomeErr",
+				},
+				nil,
+			)),
+			fn: func(t *testing.T, q *DownstreamQuerier) {
+				set, _, err := q.Select(
+					nil,
+					exactMatch("__name__", astmapper.EmbeddedQueryFlag),
+					exactMatch(astmapper.QueryLabel, astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})),
+				)
+				require.Nil(t, set)
+				require.EqualError(t, err, "SomeErr")
+			},
+		},
+		{
+			name: "returns SeriesSet",
+			querier: mkQuerier(mockHandler(
+				&PrometheusResponse{
+					Data: PrometheusData{
+						ResultType: promql.ValueTypeVector,
+						Result: []SampleStream{
+							{
+								Labels: []client.LabelAdapter{
+									{Name: "a", Value: "a1"},
+									{Name: "b", Value: "b1"},
+								},
+								Samples: []client.Sample{
+									{
+										Value:       1,
+										TimestampMs: 1,
+									},
+									{
+										Value:       2,
+										TimestampMs: 2,
+									},
+								},
+							},
+							{
+								Labels: []client.LabelAdapter{
+									{Name: "a", Value: "a1"},
+									{Name: "b", Value: "b1"},
+								},
+								Samples: []client.Sample{
+									{
+										Value:       8,
+										TimestampMs: 1,
+									},
+									{
+										Value:       9,
+										TimestampMs: 2,
+									},
+								},
+							},
+						},
+					},
+				},
+				nil,
+			)),
+			fn: func(t *testing.T, q *DownstreamQuerier) {
+				set, _, err := q.Select(
+					nil,
+					exactMatch("__name__", astmapper.EmbeddedQueryFlag),
+					exactMatch(astmapper.QueryLabel, astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})),
+				)
+				require.Nil(t, err)
+				require.Equal(
+					t,
+					NewSeriesSet([]SampleStream{
+						{
+							Labels: []client.LabelAdapter{
+								{Name: "a", Value: "a1"},
+								{Name: "b", Value: "b1"},
+							},
+							Samples: []client.Sample{
+								{
+									Value:       1,
+									TimestampMs: 1,
+								},
+								{
+									Value:       2,
+									TimestampMs: 2,
+								},
+							},
+						},
+						{
+							Labels: []client.LabelAdapter{
+								{Name: "a", Value: "a1"},
+								{Name: "b", Value: "b1"},
+							},
+							Samples: []client.Sample{
+								{
+									Value:       8,
+									TimestampMs: 1,
+								},
+								{
+									Value:       9,
+									TimestampMs: 2,
+								},
+							},
+						},
+					}),
+					set,
+				)
+			},
+		},
+	}
+
+	for _, c := range testExpr {
+		t.Run(c.name, func(t *testing.T) {
+			c.fn(t, c.querier)
+		})
+	}
+}
+
+func TestSelectConcurrent(t *testing.T) {
+	for _, c := range []struct {
+		name    string
+		queries []string
+		err     error
+	}{
+		{
+			name: "concats queries",
+			queries: []string{
+				`sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="0_of_3",baz="blip"}[1m]))`,
+				`sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="1_of_3",baz="blip"}[1m]))`,
+				`sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="2_of_3",baz="blip"}[1m]))`,
+			},
+			err: nil,
+		},
+		{
+			name: "errors",
+			queries: []string{
+				`sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="0_of_3",baz="blip"}[1m]))`,
+				`sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="1_of_3",baz="blip"}[1m]))`,
+				`sum by(__cortex_shard__) (rate(bar1{__cortex_shard__="2_of_3",baz="blip"}[1m]))`,
+			},
+			err: errors.Errorf("some-err"),
+		},
+	} {
+
+		t.Run(c.name, func(t *testing.T) {
+			// each request will return a single samplestream
+			querier := mkQuerier(mockHandler(&PrometheusResponse{
+				Data: PrometheusData{
+					ResultType: promql.ValueTypeVector,
+					Result: []SampleStream{
+						{
+							Labels: []client.LabelAdapter{
+								{Name: "a", Value: "1"},
+							},
+							Samples: []client.Sample{
+								{
+									Value:       1,
+									TimestampMs: 1,
+								},
+							},
+						},
+					},
+				},
+			}, c.err))
+
+			set, _, err := querier.Select(
+				nil,
+				exactMatch("__name__", astmapper.EmbeddedQueryFlag),
+				exactMatch(astmapper.QueryLabel, astmapper.JSONCodec.Encode(c.queries)),
+			)
+
+			if c.err != nil {
+				require.EqualError(t, err, c.err.Error())
+				return
+			}
+
+			var ct int
+			for set.Next() {
+				ct++
+			}
+			require.Equal(t, len(c.queries), ct)
+
+		})
+	}
+}
+
+// exactMatch returns an equality matcher for label k and value v, panicking if it cannot be built.
+func exactMatch(k, v string) *labels.Matcher {
+	m, err := labels.NewMatcher(labels.MatchEqual, k, v)
+	if err != nil {
+		panic(err)
+	}
+	return m
+}
+
+func mkQuerier(handler Handler) *DownstreamQuerier {
+	return &DownstreamQuerier{context.Background(), &PrometheusRequest{}, handler}
+}
diff --git a/pkg/querier/queryrange/querysharding.go b/pkg/querier/queryrange/querysharding.go
new file mode 100644
index 00000000000..37db16b8a63
--- /dev/null
+++ b/pkg/querier/queryrange/querysharding.go
@@ -0,0 +1,311 @@
+package queryrange
+
+import (
+	"context"
+	fmt "fmt"
+	"time"
+
+	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/cortexproject/cortex/pkg/querier/lazyquery"
+	"github.com/go-kit/kit/log"
+	"github.com/go-kit/kit/log/level"
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/promql"
+)
+
+var (
+	nanosecondsInMillisecond = int64(time.Millisecond / time.Nanosecond)
+
+	errInvalidShardingRange = errors.New("Query does not fit in a single sharding configuration")
+)
+
+// ShardingConfigs is a slice of chunk shard configs
+type ShardingConfigs []chunk.PeriodConfig
+
+// ValidRange returns the single sharding configuration whose period contains both start and end.
+// It fails with errInvalidShardingRange when no such configuration exists.
+func (confs ShardingConfigs) ValidRange(start, end int64) (chunk.PeriodConfig, error) {
+	for i, conf := range confs {
+		switch {
+		case start < int64(conf.From.Time):
+			// the query starts before this config's range
+			return chunk.PeriodConfig{}, errInvalidShardingRange
+		case i == len(confs)-1:
+			// the last configuration has no upper bound
+			return conf, nil
+		case end < int64(confs[i+1].From.Time):
+			// the request is entirely scoped into this shard config
+			return conf, nil
+		}
+	}
+
+	return chunk.PeriodConfig{}, errInvalidShardingRange
+}
+
+func (confs ShardingConfigs) hasShards() bool {
+	for _, conf := range confs {
+		if conf.RowShards > 0 {
+			return true
+		}
+	}
+	return false
+}
+
+func mapQuery(mapper astmapper.ASTMapper, query string) (promql.Node, error) {
+	expr, err := promql.ParseExpr(query)
+	if err != nil {
+		return nil, err
+	}
+	return mapper.Map(expr)
+}
+
+// NewQueryShardMiddleware creates a middleware which downstreams queries after AST mapping and query encoding.
+// When no configuration has a positive RowShards it logs a warning and returns a passthrough middleware.
+func NewQueryShardMiddleware(
+	logger log.Logger,
+	engine *promql.Engine,
+	confs ShardingConfigs,
+	codec Codec,
+	minShardingLookback time.Duration,
+) Middleware {
+	passthrough := MiddlewareFunc(func(next Handler) Handler {
+		return next
+	})
+
+	noshards := !confs.hasShards()
+
+	if noshards {
+		level.Warn(logger).Log(
+			"middleware", "QueryShard",
+			"msg", "no configuration with shard found",
+			"confs", fmt.Sprintf("%+v", confs),
+		)
+		return passthrough
+	}
+
+	getConf := func(r Request) (chunk.PeriodConfig, error) {
+		conf, err := confs.ValidRange(r.GetStart(), r.GetEnd())
+
+		// no single sharding config covers the query's time range
+		if err != nil {
+			return conf, err
+		}
+
+		// query doesn't have shard factor, so don't try to do AST mapping.
+		if conf.RowShards < 2 {
+			return conf, errors.Errorf("shard factor not high enough: [%d]", conf.RowShards)
+		}
+
+		return conf, nil
+	}
+
+	mapperware := MiddlewareFunc(func(next Handler) Handler {
+		return &astMapperware{
+			getConf: getConf,
+			logger:  log.With(logger, "middleware", "QueryShard.astMapperware"),
+			next:    next,
+		}
+	})
+
+	shardingware := MiddlewareFunc(func(next Handler) Handler {
+		return &queryShard{
+			getConf: getConf,
+			next:    next,
+			engine:  engine,
+		}
+	})
+
+	return MiddlewareFunc(func(next Handler) Handler {
+		return &shardSplitter{
+			codec:               codec,
+			MinShardingLookback: minShardingLookback,
+			shardingware: MergeMiddlewares(
+				InstrumentMiddleware("shardingware"),
+				mapperware,
+				shardingware,
+			).Wrap(next),
+			now:  time.Now,
+			next: InstrumentMiddleware("sharding-bypass").Wrap(next),
+		}
+	})
+}
+
+type astMapperware struct {
+	getConf func(Request) (chunk.PeriodConfig, error)
+	logger  log.Logger
+	next    Handler
+}
+
+// Do rewrites the request's query with the shard summer and subtree folder mappers and passes the mapped
+// request to next. Requests for which getConf fails are logged and passed to next unchanged.
+func (ast *astMapperware) Do(ctx context.Context, r Request) (Response, error) {
+	conf, err := ast.getConf(r)
+	// cannot shard with this timerange
+	if err != nil {
+		level.Warn(ast.logger).Log("err", err.Error())
+		return ast.next.Do(ctx, r)
+	}
+
+	shardSummer, err := astmapper.NewShardSummer(int(conf.RowShards), astmapper.VectorSquasher)
+	if err != nil {
+		return nil, err
+	}
+
+	subtreeFolder, err := astmapper.NewSubtreeFolder(astmapper.JSONCodec)
+	if err != nil {
+		return nil, err
+	}
+
+	strQuery := r.GetQuery()
+	mappedQuery, err := mapQuery(
+		astmapper.NewMultiMapper(
+			shardSummer,
+			subtreeFolder,
+		),
+		strQuery,
+	)
+	if err != nil {
+		return nil, err
+	}
+
+	strMappedQuery := mappedQuery.String()
+	level.Debug(ast.logger).Log("msg", "mapped query", "original", strQuery, "mapped", strMappedQuery)
+
+	return ast.next.Do(ctx, r.WithQuery(strMappedQuery))
+}
+
+type queryShard struct {
+	getConf func(Request) (chunk.PeriodConfig, error)
+	next    Handler
+	engine  *promql.Engine
+}
+
+// Do evaluates the request's query with the PromQL engine against a lazy DownstreamQueryable that forwards
+// to next, and wraps the extracted result in a PrometheusResponse with StatusSuccess.
+func (qs *queryShard) Do(ctx context.Context, r Request) (Response, error) {
+	// since there's no available sharding configuration for this time range,
+	// no astmapping has been performed, so skip this middleware.
+	if _, err := qs.getConf(r); err != nil {
+		return qs.next.Do(ctx, r)
+	}
+
+	queryable := lazyquery.NewLazyQueryable(&DownstreamQueryable{r, qs.next})
+
+	qry, err := qs.engine.NewRangeQuery(
+		queryable,
+		r.GetQuery(),
+		TimeFromMillis(r.GetStart()),
+		TimeFromMillis(r.GetEnd()),
+		time.Duration(r.GetStep())*time.Millisecond,
+	)
+	if err != nil {
+		return nil, err
+	}
+	res := qry.Exec(ctx)
+	extracted, err := FromResult(res)
+	if err != nil {
+		return nil, err
+	}
+	return &PrometheusResponse{
+		Status: StatusSuccess,
+		Data: PrometheusData{
+			ResultType: string(res.Value.Type()),
+			Result:     extracted,
+		},
+	}, nil
+}
+
+// shardSplitter middleware will only shard appropriate requests that do not extend past the MinShardingLookback interval.
+// This is used to send nonsharded requests to the ingesters in order to not overload them.
+type shardSplitter struct {
+	codec               Codec
+	MinShardingLookback time.Duration    // delimiter for splitting sharded vs non-sharded queries
+	shardingware        Handler          // handler for sharded queries
+	next                Handler          // handler for non-sharded queries
+	now                 func() time.Time // injectable time.Now
+}
+
+// Do partitions the request at now()-MinShardingLookback and hands both parts to parallel.
+func (splitter *shardSplitter) Do(ctx context.Context, r Request) (Response, error) {
+	cutoff := splitter.now().Add(-splitter.MinShardingLookback)
+	sharded, nonsharded := partitionRequest(r, cutoff)
+
+	return splitter.parallel(ctx, sharded, nonsharded)
+}
+
+// parallel runs the sharded and nonsharded requests concurrently and merges both responses; a nil side is skipped.
+func (splitter *shardSplitter) parallel(ctx context.Context, sharded, nonsharded Request) (Response, error) {
+	if sharded == nil {
+		return splitter.next.Do(ctx, nonsharded)
+	}
+	if nonsharded == nil {
+		return splitter.shardingware.Do(ctx, sharded)
+	}
+
+	// cancel the sibling request as soon as either half fails or the caller gives up
+	ctx, cancel := context.WithCancel(ctx)
+	defer cancel()
+	nonshardCh := make(chan Response, 1)
+	shardCh := make(chan Response, 1)
+	errCh := make(chan error, 2)
+
+	go func() {
+		res, err := splitter.next.Do(ctx, nonsharded)
+		if err != nil {
+			errCh <- err
+			return
+		}
+		nonshardCh <- res
+	}()
+	go func() {
+		res, err := splitter.shardingware.Do(ctx, sharded)
+		if err != nil {
+			errCh <- err
+			return
+		}
+		shardCh <- res
+	}()
+
+	resps := make([]Response, 0, 2)
+	for i := 0; i < 2; i++ {
+		select {
+		case r := <-nonshardCh:
+			resps = append(resps, r)
+		case r := <-shardCh:
+			resps = append(resps, r)
+		case err := <-errCh:
+			return nil, err
+		case <-ctx.Done():
+			return nil, ctx.Err()
+		}
+	}
+
+	return splitter.codec.MergeResponse(resps...)
+}
+
+// partitionRequest splits r at time t: a request ending before t is returned whole as before, one starting at or
+// after t whole as after (the other side is nil). Otherwise before ends at t and after starts at t.
+func partitionRequest(r Request, t time.Time) (before Request, after Request) {
+	boundary := TimeToMillis(t)
+	if r.GetStart() >= boundary {
+		return nil, r
+	}
+
+	if r.GetEnd() < boundary {
+		return r, nil
+	}
+
+	return r.WithStartEnd(r.GetStart(), boundary), r.WithStartEnd(boundary, r.GetEnd())
+}
+
+// TimeFromMillis converts a Unix timestamp expressed in milliseconds into a time.Time.
+func TimeFromMillis(ms int64) time.Time {
+	wholeSecs, leftoverMs := ms/1000, ms%1000
+	return time.Unix(wholeSecs, leftoverMs*nanosecondsInMillisecond)
+}
+
+// TimeToMillis converts a time.Time into a Unix timestamp expressed in milliseconds.
+func TimeToMillis(t time.Time) int64 {
+	return t.UnixNano() / nanosecondsInMillisecond
+}
diff --git a/pkg/querier/queryrange/querysharding_test.go b/pkg/querier/queryrange/querysharding_test.go
new file mode 100644
index 00000000000..90d2b176c10
--- /dev/null
+++ b/pkg/querier/queryrange/querysharding_test.go
@@ -0,0 +1,633 @@
+package queryrange
+
+import (
+	"context"
+	"fmt"
+	"math"
+	"runtime"
+	"testing"
+	"time"
+
+	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/cortexproject/cortex/pkg/util"
+	"github.com/go-kit/kit/log"
+	"github.com/pkg/errors"
+	"github.com/prometheus/common/model"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/prometheus/prometheus/storage"
+	"github.com/stretchr/testify/require"
+)
+
+func TestQueryshardingMiddleware(t *testing.T) {
+	var testExpr = []struct {
+		name     string
+		next     Handler
+		input    Request
+		ctx      context.Context
+		expected *PrometheusResponse
+		err      bool
+		override func(*testing.T, Handler)
+	}{
+		{
+			name: "invalid query error",
+			// if the query parses correctly force it to succeed
+			next: mockHandler(&PrometheusResponse{
+				Status: "",
+				Data: PrometheusData{
+					ResultType: promql.ValueTypeVector,
+					Result:     []SampleStream{},
+				},
+				ErrorType: "",
+				Error:     "",
+			}, nil),
+			input:    &PrometheusRequest{Query: "^GARBAGE"},
+			ctx:      context.Background(),
+			expected: nil,
+			err:      true,
+		},
+		{
+			name:     "downstream err",
+			next:     mockHandler(nil, errors.Errorf("some err")),
+			input:    defaultReq(),
+			ctx:      context.Background(),
+			expected: nil,
+			err:      true,
+		},
+		{
+			name: "successful trip",
+			next: mockHandler(sampleMatrixResponse(), nil),
+			override: func(t *testing.T, handler Handler) {
+
+				// pre-encode the query so it doesn't try to re-split. We're just testing if it passes through correctly
+				qry := defaultReq().WithQuery(
+					`__embedded_queries__{__cortex_queries__="{\"Concat\":[\"http_requests_total{cluster=\\\"prod\\\"}\"]}"}`,
+				)
+				out, err := handler.Do(context.Background(), qry)
+				require.Nil(t, err)
+				require.Equal(t, promql.ValueTypeMatrix, out.(*PrometheusResponse).Data.ResultType)
+				require.Equal(t, sampleMatrixResponse(), out)
+			},
+		},
+	}
+
+	for _, c := range testExpr {
+		t.Run(c.name, func(t *testing.T) {
+			engine := promql.NewEngine(promql.EngineOpts{
+				Logger:        util.Logger,
+				Reg:           nil,
+				MaxConcurrent: 10,
+				MaxSamples:    1000,
+				Timeout:       time.Minute,
+			})
+
+			handler := NewQueryShardMiddleware(
+				log.NewNopLogger(),
+				engine,
+				ShardingConfigs{
+					{
+						RowShards: 3,
+					},
+				},
+				PrometheusCodec,
+				0,
+			).Wrap(c.next)
+
+			// escape hatch for custom tests
+			if c.override != nil {
+				c.override(t, handler)
+				return
+			}
+
+			out, err := handler.Do(c.ctx, c.input)
+
+			if c.err {
+				require.NotNil(t, err)
+			} else {
+				require.Nil(t, err)
+				require.Equal(t, c.expected, out)
+			}
+
+		})
+	}
+}
+
+func sampleMatrixResponse() *PrometheusResponse {
+	return &PrometheusResponse{
+		Status: StatusSuccess,
+		Data: PrometheusData{
+			ResultType: promql.ValueTypeMatrix,
+			Result: []SampleStream{
+				{
+					Labels: []client.LabelAdapter{
+						{Name: "a", Value: "a1"},
+						{Name: "b", Value: "b1"},
+					},
+					Samples: []client.Sample{
+						{
+							TimestampMs: 5,
+							Value:       1,
+						},
+						{
+							TimestampMs: 10,
+							Value:       2,
+						},
+					},
+				},
+				{
+					Labels: []client.LabelAdapter{
+						{Name: "a", Value: "a1"},
+						{Name: "b", Value: "b1"},
+					},
+					Samples: []client.Sample{
+						{
+							TimestampMs: 5,
+							Value:       8,
+						},
+						{
+							TimestampMs: 10,
+							Value:       9,
+						},
+					},
+				},
+			},
+		},
+	}
+}
+
+func mockHandler(resp *PrometheusResponse, err error) Handler {
+	return HandlerFunc(func(ctx context.Context, req Request) (Response, error) {
+		if expired := ctx.Err(); expired != nil {
+			return nil, expired
+		}
+
+		return resp, err
+	})
+}
+
+func defaultReq() *PrometheusRequest {
+	return &PrometheusRequest{
+		Path:    "/query_range",
+		Start:   00,
+		End:     10,
+		Step:    5,
+		Timeout: time.Minute,
+		Query:   `sum(rate(http_requests_total{}[5m]))`,
+	}
+}
+
+// TestShardingConfigs_ValidRange checks which PeriodConfig, or errInvalidShardingRange, ValidRange returns for a request's time range.
+func TestShardingConfigs_ValidRange(t *testing.T) {
+	// reqWith returns the default request with Start and/or End replaced by the given dates; an empty string keeps the default.
+	reqWith := func(start, end string) *PrometheusRequest {
+		r := defaultReq()
+		if start != "" {
+			r.Start = int64(parseDate(start))
+		}
+
+		if end != "" {
+			r.End = int64(parseDate(end))
+		}
+		return r
+	}
+
+	var testExpr = []struct {
+		name     string
+		confs    ShardingConfigs
+		req      *PrometheusRequest
+		expected chunk.PeriodConfig
+		err      error
+	}{
+		{
+			name:  "0 ln configs fail",
+			confs: ShardingConfigs{},
+			req:   defaultReq(),
+			err:   errInvalidShardingRange,
+		},
+		{
+			name: "request starts before beginning config",
+			confs: ShardingConfigs{
+				{
+					From:      chunk.DayTime{Time: parseDate("2019-10-16")},
+					RowShards: 1,
+				},
+			},
+			req: reqWith("2019-10-15", ""),
+			err: errInvalidShardingRange,
+		},
+		{
+			name: "request spans multiple configs",
+			confs: ShardingConfigs{
+				{
+					From:      chunk.DayTime{Time: parseDate("2019-10-16")},
+					RowShards: 1,
+				},
+				{
+					From:      chunk.DayTime{Time: parseDate("2019-11-16")},
+					RowShards: 2,
+				},
+			},
+			req: reqWith("2019-10-15", "2019-11-17"),
+			err: errInvalidShardingRange,
+		},
+		{
+			name: "selects correct config ",
+			confs: ShardingConfigs{
+				{
+					From:      chunk.DayTime{Time: parseDate("2019-10-16")},
+					RowShards: 1,
+				},
+				{
+					From:      chunk.DayTime{Time: parseDate("2019-11-16")},
+					RowShards: 2,
+				},
+				{
+					From:      chunk.DayTime{Time: parseDate("2019-12-16")},
+					RowShards: 3,
+				},
+			},
+			req: reqWith("2019-11-20", "2019-11-25"),
+			expected: chunk.PeriodConfig{
+				From:      chunk.DayTime{Time: parseDate("2019-11-16")},
+				RowShards: 2,
+			},
+		},
+	}
+
+	for _, c := range testExpr {
+		t.Run(c.name, func(t *testing.T) {
+			out, err := c.confs.ValidRange(c.req.Start, c.req.End)
+
+			if c.err != nil {
+				require.EqualError(t, err, c.err.Error())
+			} else {
+				require.Nil(t, err)
+				require.Equal(t, c.expected, out)
+			}
+		})
+	}
+}
+
+// TestTimeFromMillis checks that TimeFromMillis turns millisecond timestamps into the matching time.Time.
+func TestTimeFromMillis(t *testing.T) {
+	var testExpr = []struct {
+		input    int64
+		expected time.Time
+	}{
+		{input: 1000, expected: time.Unix(1, 0)},
+		{input: 1500, expected: time.Unix(1, 500*nanosecondsInMillisecond)},
+	}
+	for i, c := range testExpr {
+		// fmt.Sprint names the subtests "0", "1", ...; string(i) would yield the rune with code point i
+		t.Run(fmt.Sprint(i), func(t *testing.T) {
+			require.Equal(t, c.expected, TimeFromMillis(c.input))
+		})
+	}
+}
+
+// parseDate parses a YYYY-MM-DD date into a model.Time and panics on bad input.
+func parseDate(in string) model.Time {
+	t, err := time.Parse("2006-01-02", in)
+	if err != nil {
+		panic(err)
+	}
+	return model.TimeFromUnixNano(t.UnixNano()) // model.Time counts milliseconds, not nanoseconds
+}
+// mappingValidator is a Handler that can be injected into a middleware chain to
+// assert that the query reaching it matches an expected query.
+type mappingValidator struct {
+	expected string
+	next     Handler
+}
+
+// Do fails on an unparsable or unexpected query; otherwise it calls the next Handler.
+func (v *mappingValidator) Do(ctx context.Context, req Request) (Response, error) {
+	parsed, err := promql.ParseExpr(req.GetQuery())
+	if err != nil {
+		return nil, err
+	}
+	if got := parsed.String(); got != v.expected {
+		return nil, errors.Errorf("bad query mapping: expected [%s], got [%s]", v.expected, got)
+	}
+	return v.next.Do(ctx, req)
+}
+
+// approximatelyEquals asserts that two responses have the same status and, when
+// successful, the same series (labels and timestamps) with sample values equal
+// after rounding to 6 decimal places. Neither response is modified.
+func approximatelyEquals(t *testing.T, a, b *PrometheusResponse) {
+	t.Helper() // report failures at the calling test's line
+	require.Equal(t, a.Status, b.Status)
+	if a.Status != StatusSuccess {
+		return
+	}
+
+	as, err := ResponseToSamples(a)
+	require.Nil(t, err)
+	bs, err := ResponseToSamples(b)
+	require.Nil(t, err)
+	require.Equal(t, len(as), len(bs))
+
+	round := func(v float64) float64 { return math.Round(v*1e6) / 1e6 }
+	for i := range as {
+		require.Equal(t, as[i].Labels, bs[i].Labels)
+		require.Equal(t, len(as[i].Samples), len(bs[i].Samples))
+		// compare rounded copies so the caller's responses stay untouched
+		for j, aSample := range as[i].Samples {
+			bSample := bs[i].Samples[j]
+			require.Equal(t, aSample.TimestampMs, bSample.TimestampMs)
+			require.Equal(t, round(aSample.Value), round(bSample.Value))
+		}
+	}
+}
+
+// TestQueryshardingCorrectness checks, for each query, the AST mapping it is rewritten to and that sharded execution matches unsharded execution.
+func TestQueryshardingCorrectness(t *testing.T) {
+	shardFactor := 2
+	req := &PrometheusRequest{
+		Path:  "/query_range",
+		Start: start.UnixNano() / nanosecondsInMillisecond,
+		End:   end.UnixNano() / nanosecondsInMillisecond,
+		Step:  int64(step) / int64(time.Second),
+	}
+	for _, tc := range []struct {
+		desc   string
+		query  string
+		mapped string
+	}{
+		{
+			desc:   "fully encoded histogram_quantile",
+			query:  `histogram_quantile(0.5, rate(bar1{baz="blip"}[30s]))`,
+			mapped: `__embedded_queries__{__cortex_queries__="{\"Concat\":[\"histogram_quantile(0.5, rate(bar1{baz=\\\"blip\\\"}[30s]))\"]}"}`,
+		},
+		{
+			desc:   "entire query with shard summer",
+			query:  `sum by (foo,bar) (min_over_time(bar1{baz="blip"}[1m]))`,
+			mapped: `sum by(foo, bar) (__embedded_queries__{__cortex_queries__="{\"Concat\":[\"sum by(foo, bar, __cortex_shard__) (min_over_time(bar1{__cortex_shard__=\\\"0_of_2\\\",baz=\\\"blip\\\"}[1m]))\",\"sum by(foo, bar, __cortex_shard__) (min_over_time(bar1{__cortex_shard__=\\\"1_of_2\\\",baz=\\\"blip\\\"}[1m]))\"]}"})`,
+		},
+		{
+			desc:   "shard one leg encode the other",
+			query:  "sum(rate(bar1[1m])) or rate(bar1[1m])",
+			mapped: `sum without(__cortex_shard__) (__embedded_queries__{__cortex_queries__="{\"Concat\":[\"sum by(__cortex_shard__) (rate(bar1{__cortex_shard__=\\\"0_of_2\\\"}[1m]))\",\"sum by(__cortex_shard__) (rate(bar1{__cortex_shard__=\\\"1_of_2\\\"}[1m]))\"]}"}) or __embedded_queries__{__cortex_queries__="{\"Concat\":[\"rate(bar1[1m])\"]}"}`,
+		},
+		{
+			desc:   "should skip encoding leaf scalar/strings",
+			query:  `histogram_quantile(0.5, sum(rate(cortex_cache_value_size_bytes_bucket[5m])) by (le))`,
+			mapped: `histogram_quantile(0.5, sum by(le) (__embedded_queries__{__cortex_queries__="{\"Concat\":[\"sum by(le, __cortex_shard__) (rate(cortex_cache_value_size_bytes_bucket{__cortex_shard__=\\\"0_of_2\\\"}[5m]))\",\"sum by(le, __cortex_shard__) (rate(cortex_cache_value_size_bytes_bucket{__cortex_shard__=\\\"1_of_2\\\"}[5m]))\"]}"}))`,
+		},
+	} {
+		t.Run(tc.desc, func(t *testing.T) {
+			shardingConf := ShardingConfigs{
+				chunk.PeriodConfig{
+					Schema:    "v10",
+					RowShards: uint32(shardFactor),
+				},
+			}
+			shardingware := NewQueryShardMiddleware(
+				log.NewNopLogger(),
+				engine,
+				// ensure that all requests are shard compatible
+				shardingConf,
+				PrometheusCodec,
+				0,
+			)
+
+			downstream := &downstreamHandler{
+				engine:    engine,
+				queryable: shardAwareQueryable,
+			}
+
+			assertionMWare := MiddlewareFunc(func(next Handler) Handler {
+				return &mappingValidator{
+					expected: tc.mapped,
+					next:     next,
+				}
+			})
+
+			mapperware := MiddlewareFunc(func(next Handler) Handler {
+				return &astMapperware{
+					getConf: func(_ Request) (chunk.PeriodConfig, error) {
+						return shardingConf[0], nil
+					},
+					logger: log.NewNopLogger(),
+					next:   next,
+				}
+			})
+
+			r := req.WithQuery(tc.query)
+			// ensure the expected ast mapping occurs
+			_, err := MergeMiddlewares(mapperware, assertionMWare).Wrap(downstream).Do(context.Background(), r)
+			require.Nil(t, err)
+			// the sharded and unsharded runs must then return approximately equal results
+			shardedRes, err := shardingware.Wrap(downstream).Do(context.Background(), r)
+			require.Nil(t, err)
+
+			res, err := downstream.Do(context.Background(), r)
+			require.Nil(t, err)
+
+			approximatelyEquals(t, res.(*PrometheusResponse), shardedRes.(*PrometheusResponse))
+		})
+	}
+}
+
+// TestShardSplitting pins the shard splitter's clock to the request end and
+// checks that its response approximately equals the plain downstream response.
+func TestShardSplitting(t *testing.T) {
+	downstream := &downstreamHandler{
+		engine:    engine,
+		queryable: shardAwareQueryable,
+	}
+
+	// ensure that all requests are shard compatible
+	confs := ShardingConfigs{
+		chunk.PeriodConfig{
+			Schema:    "v10",
+			RowShards: uint32(2),
+		},
+	}
+	halfRange := end.Sub(start) / 2 // shard 1/2 of the req
+
+	splitter := NewQueryShardMiddleware(
+		log.NewNopLogger(),
+		engine,
+		confs,
+		PrometheusCodec,
+		halfRange,
+	).Wrap(downstream).(*shardSplitter)
+	splitter.now = func() time.Time { return end } // make the split cut the request in half (don't use time.Now)
+
+	req := &PrometheusRequest{
+		Path:  "/query_range",
+		Start: start.UnixNano() / nanosecondsInMillisecond,
+		End:   end.UnixNano() / nanosecondsInMillisecond,
+		Step:  int64(step) / int64(time.Second),
+		Query: "sum(rate(bar1[1m]))",
+	}
+	split, err := splitter.Do(context.Background(), req)
+	require.Nil(t, err)
+	plain, err := downstream.Do(context.Background(), req)
+	require.Nil(t, err)
+
+	approximatelyEquals(t, plain.(*PrometheusResponse), split.(*PrometheusResponse))
+}
+
+// BenchmarkQuerySharding runs sum queries through the sharding middleware over a mock queryable, for power-of-two shard factors with and without a per-series delay.
+func BenchmarkQuerySharding(b *testing.B) {
+	var shards []uint32
+
+	// max out at half available cpu cores in order to minimize noisy neighbor issues while benchmarking
+	for shard := 1; shard <= runtime.NumCPU()/2; shard = shard * 2 {
+		shards = append(shards, uint32(shard))
+	}
+
+	for _, tc := range []struct {
+		labelBuckets     int
+		labels           []string
+		samplesPerSeries int
+		query            string
+		desc             string
+	}{
+		// Ensure you have enough cores to run these tests without blocking.
+		// We want to simulate parallel computations and waiting in queue doesn't help
+
+		// no-group
+		{
+			labelBuckets:     16,
+			labels:           []string{"a", "b", "c"},
+			samplesPerSeries: 100,
+			query:            `sum(rate(http_requests_total[5m]))`,
+			desc:             "sum nogroup",
+		},
+		// sum by
+		{
+			labelBuckets:     16,
+			labels:           []string{"a", "b", "c"},
+			samplesPerSeries: 100,
+			query:            `sum by(a) (rate(http_requests_total[5m]))`,
+			desc:             "sum by",
+		},
+		// sum without
+		{
+			labelBuckets:     16,
+			labels:           []string{"a", "b", "c"},
+			samplesPerSeries: 100,
+			query:            `sum without (a) (rate(http_requests_total[5m]))`,
+			desc:             "sum without",
+		},
+	} {
+		for _, delayPerSeries := range []time.Duration{
+			0,
+			time.Millisecond / 10,
+		} {
+			engine := promql.NewEngine(promql.EngineOpts{
+				Logger: util.Logger,
+				Reg:    nil,
+				// set high concurrency so we're not bottlenecked here
+				MaxConcurrent: 100000,
+				MaxSamples:    100000000,
+				Timeout:       time.Minute,
+			})
+
+			queryable := NewMockShardedQueryable(
+				tc.samplesPerSeries,
+				tc.labels,
+				tc.labelBuckets,
+				delayPerSeries,
+			)
+			downstream := &downstreamHandler{
+				engine:    engine,
+				queryable: queryable,
+			}
+
+			var (
+				start int64 = 0
+				end         = int64(1000 * tc.samplesPerSeries)
+				step        = (end - start) / 1000
+			)
+
+			req := &PrometheusRequest{
+				Path:    "/query_range",
+				Start:   start,
+				End:     end,
+				Step:    step,
+				Timeout: time.Minute,
+				Query:   tc.query,
+			}
+
+			for _, shardFactor := range shards {
+				shardingware := NewQueryShardMiddleware(
+					log.NewNopLogger(),
+					engine,
+					// ensure that all requests are shard compatible
+					ShardingConfigs{
+						chunk.PeriodConfig{
+							Schema:    "v10",
+							RowShards: shardFactor,
+						},
+					},
+					PrometheusCodec,
+					0,
+				).Wrap(downstream)
+
+				b.Run(
+					fmt.Sprintf(
+						"desc:[%s]---shards:[%d]---series:[%.0f]---delayPerSeries:[%s]---samplesPerSeries:[%d]",
+						tc.desc,
+						shardFactor,
+						math.Pow(float64(tc.labelBuckets), float64(len(tc.labels))),
+						delayPerSeries,
+						tc.samplesPerSeries,
+					),
+					func(b *testing.B) {
+						for n := 0; n < b.N; n++ {
+							_, err := shardingware.Do(
+								context.Background(),
+								req,
+							)
+							if err != nil {
+								b.Fatal(err.Error())
+							}
+						}
+					},
+				)
+			}
+			fmt.Println()
+		}
+
+		fmt.Print("--------------------------------\n\n")
+	}
+}
+
+// downstreamHandler is a Handler that evaluates requests with a promql engine against a queryable.
+type downstreamHandler struct {
+	engine    *promql.Engine
+	queryable storage.Queryable
+}
+
+// Do runs r as a range query (start/end as millisecond timestamps, step in milliseconds) and wraps the result in a PrometheusResponse.
+func (h *downstreamHandler) Do(ctx context.Context, r Request) (Response, error) {
+	qry, err := h.engine.NewRangeQuery(
+		h.queryable,
+		r.GetQuery(),
+		TimeFromMillis(r.GetStart()),
+		TimeFromMillis(r.GetEnd()),
+		time.Duration(r.GetStep())*time.Millisecond,
+	)
+	if err != nil {
+		return nil, err
+	}
+	// release the query's resources on return; FromResult has copied the points by then
+	defer qry.Close()
+	res := qry.Exec(ctx)
+	extracted, err := FromResult(res)
+	if err != nil {
+		return nil, err
+	}
+	return &PrometheusResponse{
+		Status: StatusSuccess,
+		Data: PrometheusData{
+			ResultType: string(res.Value.Type()),
+			Result:     extracted,
+		},
+	}, nil
+}
diff --git a/pkg/querier/queryrange/results_cache.go b/pkg/querier/queryrange/results_cache.go
index 7bcbedebe4d..6076a978177 100644
--- a/pkg/querier/queryrange/results_cache.go
+++ b/pkg/querier/queryrange/results_cache.go
@@ -76,7 +76,7 @@ func (t constSplitter) GenerateCacheKey(userID string, r Request) string {
 var PrometheusResponseExtractor = ExtractorFunc(func(start, end int64, from Response) Response {
 	promRes := from.(*PrometheusResponse)
 	return &PrometheusResponse{
-		Status: statusSuccess,
+		Status: StatusSuccess,
 		Data: PrometheusData{
 			ResultType: promRes.Data.ResultType,
 			Result:     extractMatrix(start, end, promRes.Data.Result),
diff --git a/pkg/querier/queryrange/results_cache_test.go b/pkg/querier/queryrange/results_cache_test.go
index 59020aa7c3f..d38bb84340d 100644
--- a/pkg/querier/queryrange/results_cache_test.go
+++ b/pkg/querier/queryrange/results_cache_test.go
@@ -58,7 +58,7 @@ var (
 )
 
 var dummyResponse = &PrometheusResponse{
-	Status: statusSuccess,
+	Status: StatusSuccess,
 	Data: PrometheusData{
 		ResultType: matrix,
 		Result: []SampleStream{
@@ -87,7 +87,7 @@ func mkAPIResponse(start, end, step int64) *PrometheusResponse {
 	}
 
 	return &PrometheusResponse{
-		Status: statusSuccess,
+		Status: StatusSuccess,
 		Data: PrometheusData{
 			ResultType: matrix,
 			Result: []SampleStream{
diff --git a/pkg/querier/queryrange/roundtrip.go b/pkg/querier/queryrange/roundtrip.go
index 6e87d78c6e5..d55db7893fc 100644
--- a/pkg/querier/queryrange/roundtrip.go
+++ b/pkg/querier/queryrange/roundtrip.go
@@ -25,8 +25,11 @@ import (
 
 	"github.com/go-kit/kit/log"
 	"github.com/go-kit/kit/log/level"
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/promql"
 	"github.com/weaveworks/common/user"
 
+	"github.com/cortexproject/cortex/pkg/chunk"
 	"github.com/cortexproject/cortex/pkg/chunk/cache"
 	"github.com/cortexproject/cortex/pkg/querier/frontend"
 )
@@ -41,6 +44,7 @@ type Config struct {
 	ResultsCacheConfig     `yaml:"results_cache"`
 	CacheResults           bool `yaml:"cache_results"`
 	MaxRetries             int  `yaml:"max_retries"`
+	SumShards              bool `yaml:"sum_shards"`
 }
 
 // RegisterFlags adds the flags required to config this to the given FlagSet.
@@ -50,6 +54,7 @@ func (cfg *Config) RegisterFlags(f *flag.FlagSet) {
 	f.DurationVar(&cfg.SplitQueriesByInterval, "querier.split-queries-by-interval", 0, "Split queries by an interval and execute in parallel, 0 disables it. You should use an a multiple of 24 hours (same as the storage bucketing scheme), to avoid queriers downloading and processing the same chunks. This also determines how cache keys are chosen when result caching is enabled")
 	f.BoolVar(&cfg.AlignQueriesWithStep, "querier.align-querier-with-step", false, "Mutate incoming queries to align their start and end with their step.")
 	f.BoolVar(&cfg.CacheResults, "querier.cache-results", false, "Cache query results.")
+	f.BoolVar(&cfg.SumShards, "querier.sum-shards", false, "Parse the ast and parallelize sums by shard.")
 	cfg.ResultsCacheConfig.RegisterFlags(f)
 }
 
@@ -104,7 +109,16 @@ func MergeMiddlewares(middleware ...Middleware) Middleware {
 }
 
 // NewTripperware returns a Tripperware configured with middlewares to limit, align, split, retry and cache requests.
-func NewTripperware(cfg Config, log log.Logger, limits Limits, codec Codec, cacheExtractor Extractor) (frontend.Tripperware, cache.Cache, error) {
+func NewTripperware(
+	cfg Config,
+	log log.Logger,
+	limits Limits,
+	codec Codec,
+	cacheExtractor Extractor,
+	schema chunk.SchemaConfig,
+	engineOpts promql.EngineOpts,
+	minShardingLookback time.Duration,
+) (frontend.Tripperware, cache.Cache, error) {
 	queryRangeMiddleware := []Middleware{LimitsMiddleware(limits)}
 	if cfg.AlignQueriesWithStep {
 		queryRangeMiddleware = append(queryRangeMiddleware, InstrumentMiddleware("step_align"), StepAlignMiddleware)
@@ -112,6 +126,7 @@ func NewTripperware(cfg Config, log log.Logger, limits Limits, codec Codec, cach
 	if cfg.SplitQueriesByInterval != 0 {
 		queryRangeMiddleware = append(queryRangeMiddleware, InstrumentMiddleware("split_by_interval"), SplitByIntervalMiddleware(cfg.SplitQueriesByInterval, limits, codec))
 	}
+
 	var c cache.Cache
 	if cfg.CacheResults {
 		queryCacheMiddleware, cache, err := NewResultsCacheMiddleware(log, cfg.ResultsCacheConfig, constSplitter(cfg.SplitQueriesByInterval), limits, codec, cacheExtractor)
@@ -121,6 +136,27 @@ func NewTripperware(cfg Config, log log.Logger, limits Limits, codec Codec, cach
 		c = cache
 		queryRangeMiddleware = append(queryRangeMiddleware, InstrumentMiddleware("results_cache"), queryCacheMiddleware)
 	}
+
+	if cfg.SumShards {
+
+		if minShardingLookback == 0 {
+			return nil, nil, errors.New("a non-zero value is required for querier.query-ingesters-within when querier.sum-shards is enabled")
+		}
+
+		shardingware := NewQueryShardMiddleware(
+			log,
+			promql.NewEngine(engineOpts),
+			schema.Configs,
+			codec,
+			minShardingLookback,
+		)
+
+		queryRangeMiddleware = append(
+			queryRangeMiddleware,
+			shardingware, // instrumentation is included in the sharding middleware
+		)
+	}
+
 	if cfg.MaxRetries > 0 {
 		queryRangeMiddleware = append(queryRangeMiddleware, InstrumentMiddleware("retry"), NewRetryMiddleware(log, cfg.MaxRetries))
 	}
diff --git a/pkg/querier/queryrange/roundtrip_test.go b/pkg/querier/queryrange/roundtrip_test.go
index 1d0491c252c..65e04e1e5c7 100644
--- a/pkg/querier/queryrange/roundtrip_test.go
+++ b/pkg/querier/queryrange/roundtrip_test.go
@@ -8,7 +8,12 @@ import (
 	"net/url"
 	"strconv"
 	"testing"
+	"time"
 
+	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/util"
+	"github.com/go-kit/kit/log"
+	"github.com/prometheus/prometheus/promql"
 	"github.com/stretchr/testify/require"
 	"github.com/weaveworks/common/middleware"
 	"github.com/weaveworks/common/user"
@@ -42,7 +47,22 @@ func TestRoundTrip(t *testing.T) {
 		next: http.DefaultTransport,
 	}
 
-	tw, _, err := NewTripperware(Config{}, util.Logger, fakeLimits{}, PrometheusCodec, nil)
+	tw, _, err := NewTripperware(Config{},
+		util.Logger,
+		fakeLimits{},
+		PrometheusCodec,
+		nil,
+		chunk.SchemaConfig{},
+		promql.EngineOpts{
+			Logger:        util.Logger,
+			Reg:           nil,
+			MaxConcurrent: 10,
+			MaxSamples:    1000,
+			Timeout:       time.Minute,
+		},
+		0,
+	)
+
 	if err != nil {
 		t.Fatal(err)
 	}
@@ -86,3 +106,18 @@ func (s singleHostRoundTripper) RoundTrip(r *http.Request) (*http.Response, erro
 	r.URL.Host = s.host
 	return s.next.RoundTrip(r)
 }
+
+func Test_ShardingConfigError(t *testing.T) {
+	_, _, err := NewTripperware(
+		Config{SumShards: true},
+		log.NewNopLogger(),
+		nil,
+		nil,
+		nil,
+		chunk.SchemaConfig{},
+		promql.EngineOpts{},
+		0,
+	)
+
+	require.EqualError(t, err, "a non-zero value is required for querier.query-ingesters-within when querier.sum-shards is enabled")
+}
diff --git a/pkg/querier/queryrange/series.go b/pkg/querier/queryrange/series.go
new file mode 100644
index 00000000000..85a7b135531
--- /dev/null
+++ b/pkg/querier/queryrange/series.go
@@ -0,0 +1,55 @@
+package queryrange
+
+import (
+	"github.com/cortexproject/cortex/pkg/querier/series"
+	"github.com/pkg/errors"
+	"github.com/prometheus/common/model"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/prometheus/prometheus/storage"
+)
+
+// ResponseToSamples extracts the sample streams carried by an API response.
+// It fails when resp is not a *PrometheusResponse, when the response carries an
+// error message, or when its result type is neither a vector nor a matrix.
+func ResponseToSamples(resp Response) ([]SampleStream, error) {
+	promRes, isProm := resp.(*PrometheusResponse)
+	if !isProm {
+		return nil, errors.Errorf("error invalid response type: %T, expected: %T", resp, &PrometheusResponse{})
+	}
+	if msg := promRes.Error; msg != "" {
+		return nil, errors.New(msg)
+	}
+
+	resultType := promRes.Data.ResultType
+	if resultType == promql.ValueTypeVector || resultType == promql.ValueTypeMatrix {
+		return promRes.Data.Result, nil
+	}
+	return nil, errors.Errorf(
+		"Invalid promql.Value type: [%s]. Only %s and %s supported",
+		resultType, promql.ValueTypeVector, promql.ValueTypeMatrix,
+	)
+}
+
+// NewSeriesSet wraps a []SampleStream in an in memory storage.SeriesSet, copying
+// each stream's labels and samples into a concrete series.
+func NewSeriesSet(results []SampleStream) storage.SeriesSet {
+	all := make([]storage.Series, len(results))
+	for i := range results {
+		stream := &results[i]
+		lbls := make([]labels.Label, len(stream.Labels))
+		for j, l := range stream.Labels {
+			lbls[j] = labels.Label(l)
+		}
+
+		pairs := make([]model.SamplePair, len(stream.Samples))
+		for j, s := range stream.Samples {
+			pairs[j] = model.SamplePair{
+				Timestamp: model.Time(s.TimestampMs),
+				Value:     model.SampleValue(s.Value),
+			}
+		}
+		all[i] = series.NewConcreteSeries(lbls, pairs)
+	}
+	return series.NewConcreteSeriesSet(all)
+}
diff --git a/pkg/querier/queryrange/series_test.go b/pkg/querier/queryrange/series_test.go
new file mode 100644
index 00000000000..262503e8538
--- /dev/null
+++ b/pkg/querier/queryrange/series_test.go
@@ -0,0 +1,75 @@
+package queryrange
+
+import (
+	"testing"
+
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/stretchr/testify/require"
+)
+
+// Test_ResponseToSamples round-trips a matrix response through ResponseToSamples and NewSeriesSet and checks the timestamps and values read back.
+func Test_ResponseToSamples(t *testing.T) {
+	input := &PrometheusResponse{
+		Data: PrometheusData{
+			ResultType: promql.ValueTypeMatrix,
+			Result: []SampleStream{
+				{
+					Labels: []client.LabelAdapter{
+						{Name: "a", Value: "a1"},
+						{Name: "b", Value: "b1"},
+					},
+					Samples: []client.Sample{
+						{
+							Value:       1,
+							TimestampMs: 1,
+						},
+						{
+							Value:       2,
+							TimestampMs: 2,
+						},
+					},
+				},
+				{
+					Labels: []client.LabelAdapter{
+						{Name: "a", Value: "a1"},
+						{Name: "b", Value: "b1"},
+					},
+					Samples: []client.Sample{
+						{
+							Value:       8,
+							TimestampMs: 1,
+						},
+						{
+							Value:       9,
+							TimestampMs: 2,
+						},
+					},
+				},
+			},
+		},
+	}
+
+	streams, err := ResponseToSamples(input)
+	require.Nil(t, err)
+	set := NewSeriesSet(streams)
+
+	setCt := 0
+	// every series and sample must come back in input order
+	for set.Next() {
+		iter := set.At().Iterator()
+		require.Nil(t, set.Err())
+
+		sampleCt := 0
+		for iter.Next() {
+			ts, v := iter.At()
+			require.Equal(t, input.Data.Result[setCt].Samples[sampleCt].TimestampMs, ts)
+			require.Equal(t, input.Data.Result[setCt].Samples[sampleCt].Value, v)
+			sampleCt++
+		}
+		require.Equal(t, len(input.Data.Result[setCt].Samples), sampleCt)
+		setCt++
+	}
+
+	require.Equal(t, len(input.Data.Result), setCt)
+}
diff --git a/pkg/querier/queryrange/test_utils.go b/pkg/querier/queryrange/test_utils.go
new file mode 100644
index 00000000000..0eb68a394b3
--- /dev/null
+++ b/pkg/querier/queryrange/test_utils.go
@@ -0,0 +1,186 @@
+package queryrange
+
+import (
+	"context"
+	"fmt"
+	"time"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/cortexproject/cortex/pkg/querier/series"
+	"github.com/pkg/errors"
+	"github.com/prometheus/common/model"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/storage"
+)
+
+// genLabels returns every combination of the names in labelSet with the values
+// "0" to "labelBuckets-1": labelBuckets^len(labelSet) sets, or none if labelSet is empty.
+func genLabels(
+	labelSet []string,
+	labelBuckets int,
+) (result []labels.Labels) {
+	if len(labelSet) == 0 {
+		return result
+	}
+
+	l := labelSet[0]
+	rest := genLabels(labelSet[1:], labelBuckets)
+
+	for i := 0; i < labelBuckets; i++ {
+		x := labels.Label{
+			Name:  l,
+			Value: fmt.Sprintf("%d", i),
+		}
+		if len(rest) == 0 {
+			result = append(result, labels.Labels{x})
+			continue
+		}
+		for _, others := range rest {
+			// copy first: append(others, x) could reuse others' spare capacity and alias the sets built for different i
+			set := append(make(labels.Labels, 0, len(others)+1), others...)
+			result = append(result, append(set, x))
+		}
+	}
+	return result
+}
+
+// NewMockShardedQueryable creates a shard-aware in memory queryable holding one
+// series per label set from genLabels(labelSet, labelBuckets). Every series
+// shares the same nSamples samples: sample i has timestamp i*1000 and value i.
+func NewMockShardedQueryable(
+	nSamples int,
+	labelSet []string,
+	labelBuckets int,
+	delayPerSeries time.Duration,
+) *MockShardedQueryable {
+	samples := make([]model.SamplePair, nSamples)
+	for i := range samples {
+		samples[i] = model.SamplePair{
+			Timestamp: model.Time(i * 1000),
+			Value:     model.SampleValue(i),
+		}
+	}
+
+	q := &MockShardedQueryable{delayPerSeries: delayPerSeries}
+	combos := genLabels(labelSet, labelBuckets)
+	q.series = make([]storage.Series, 0, len(combos))
+	for _, ls := range combos {
+		q.series = append(q.series, series.NewConcreteSeries(ls, samples))
+	}
+	return q
+}
+
+// MockShardedQueryable is an in memory, shard-aware queryable over a fixed list of series; it is exported to be reused in the querysharding benchmarking
+type MockShardedQueryable struct {
+	series         []storage.Series
+	delayPerSeries time.Duration
+}
+
+// Querier impls storage.Queryable; q acts as its own Querier, so ctx, mint and maxt are ignored
+func (q *MockShardedQueryable) Querier(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
+	return q, nil
+}
+
+// Select impls storage.Querier. Without a shard matcher it returns every series;
+// with one it returns that shard's contiguous range of the series, the last
+// shard also taking any remainder. The value of an equality matcher on __name__,
+// if present, is attached to each returned series. The call lasts at least
+// delayPerSeries per stored series, divided by the shard count when sharded.
+func (q *MockShardedQueryable) Select(
+	_ *storage.SelectParams,
+	matchers ...*labels.Matcher,
+) (storage.SeriesSet, storage.Warnings, error) {
+	tStart := time.Now()
+
+	shard, _, err := astmapper.ShardFromMatchers(matchers)
+	if err != nil {
+		return nil, nil, err
+	}
+
+	// an unsharded query covers the whole series range
+	start, end := 0, len(q.series)
+	if shard != nil {
+		// return the series range associated with this shard
+		seriesPerShard := len(q.series) / shard.Of
+		start = shard.Shard * seriesPerShard
+		end = start + seriesPerShard
+
+		// the series count may not divide evenly by shard.Of; the last shard
+		// takes the leftover series so the shards together cover all of them
+		if shard.Shard == shard.Of-1 {
+			end = len(q.series)
+		}
+	}
+
+	// remember the metric name, if one was selected by equality, to label the results
+	var name string
+	for _, m := range matchers {
+		if m.Type == labels.MatchEqual && m.Name == "__name__" {
+			name = m.Value
+		}
+	}
+
+	results := make([]storage.Series, 0, end-start)
+	for i := start; i < end; i++ {
+		results = append(results, &ShardLabelSeries{
+			shard:  shard,
+			name:   name,
+			Series: q.series[i],
+		})
+	}
+
+	// loosely enforce the assumption that an operation on 1/nth of the data
+	// takes 1/nth of the time.
+	duration := q.delayPerSeries * time.Duration(len(q.series))
+	if shard != nil {
+		duration = duration / time.Duration(shard.Of)
+	}
+
+	// sleep only for the part of that duration which has not already elapsed
+	remaining := time.Until(tStart.Add(duration))
+	if remaining > 0 {
+		time.Sleep(remaining)
+	}
+
+	return series.NewConcreteSeriesSet(results), nil, nil
+}
+
+// ShardLabelSeries allows extending a Series with new labels. This is helpful for adding cortex shard labels
+type ShardLabelSeries struct {
+	shard *astmapper.ShardAnnotation
+	name  string
+	storage.Series
+}
+
+// Labels impls storage.Series. It returns the wrapped series' labels followed by
+// a __name__ label (when name is set) and the shard label (when shard is set).
+// The result is a fresh slice: appending to the wrapped labels in place could
+// write into backing storage shared with other users of the wrapped series.
+func (s *ShardLabelSeries) Labels() labels.Labels {
+	base := s.Series.Labels()
+	ls := make(labels.Labels, 0, len(base)+2)
+	ls = append(ls, base...)
+
+	if s.name != "" {
+		ls = append(ls, labels.Label{Name: "__name__", Value: s.name})
+	}
+	if s.shard != nil {
+		ls = append(ls, s.shard.Label())
+	}
+	return ls
+}
+
+// LabelValues impls storage.Querier; the mock does not implement it and always returns an error
+func (q *MockShardedQueryable) LabelValues(name string) ([]string, storage.Warnings, error) {
+	return nil, nil, errors.Errorf("unimplemented")
+}
+
+// LabelNames is not implemented by the mock: it returns no names and always returns an error.
+func (q *MockShardedQueryable) LabelNames() ([]string, storage.Warnings, error) {
+	return nil, nil, errors.Errorf("unimplemented")
+}
+
+// Close does nothing and always returns nil.
+func (q *MockShardedQueryable) Close() error {
+	return nil
+}
diff --git a/pkg/querier/queryrange/test_utils_test.go b/pkg/querier/queryrange/test_utils_test.go
new file mode 100644
index 00000000000..8e5f187b927
--- /dev/null
+++ b/pkg/querier/queryrange/test_utils_test.go
@@ -0,0 +1,134 @@
+package queryrange
+
+import (
+	"math"
+	"sort"
+	"testing"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/stretchr/testify/require"
+)
+
+// TestGenLabelsCorrectness checks that two labels with two buckets yield, once each set is sorted, all four combinations in order.
+func TestGenLabelsCorrectness(t *testing.T) {
+	ls := genLabels([]string{"a", "b"}, 2)
+	for _, set := range ls {
+		sort.Sort(set)
+	}
+	expected := []labels.Labels{
+		{
+			labels.Label{
+				Name:  "a",
+				Value: "0",
+			},
+			labels.Label{
+				Name:  "b",
+				Value: "0",
+			},
+		},
+		{
+			labels.Label{
+				Name:  "a",
+				Value: "0",
+			},
+			labels.Label{
+				Name:  "b",
+				Value: "1",
+			},
+		},
+		{
+			labels.Label{
+				Name:  "a",
+				Value: "1",
+			},
+			labels.Label{
+				Name:  "b",
+				Value: "0",
+			},
+		},
+		{
+			labels.Label{
+				Name:  "a",
+				Value: "1",
+			},
+			labels.Label{
+				Name:  "b",
+				Value: "1",
+			},
+		},
+	}
+	require.Equal(t, expected, ls)
+}
+func TestGenLabelsSize(t *testing.T) {
+	for _, tc := range []struct {
+		set     []string
+		buckets int
+	}{
+		{
+			set:     []string{"a", "b"},
+			buckets: 5,
+		},
+		{
+			set:     []string{"a", "b", "c"},
+			buckets: 10,
+		},
+	} {
+		sets := genLabels(tc.set, tc.buckets)
+		require.Equal(
+			t,
+			math.Pow(float64(tc.buckets), float64(len(tc.set))),
+			float64(len(sets)),
+		)
+	}
+}
+
+func TestNewMockShardedqueryable(t *testing.T) {
+	for _, tc := range []struct {
+		shards, nSamples, labelBuckets int
+		labelSet                       []string
+	}{
+		{
+			nSamples:     100,
+			shards:       1,
+			labelBuckets: 3,
+			labelSet:     []string{"a", "b", "c"},
+		},
+		{
+			nSamples:     0,
+			shards:       2,
+			labelBuckets: 3,
+			labelSet:     []string{"a", "b", "c"},
+		},
+	} {
+		q := NewMockShardedQueryable(tc.nSamples, tc.labelSet, tc.labelBuckets, 0)
+		expectedSeries := int(math.Pow(float64(tc.labelBuckets), float64(len(tc.labelSet))))
+
+		seriesCt := 0
+		for i := 0; i < tc.shards; i++ {
+
+			set, _, err := q.Select(nil, &labels.Matcher{
+				Type: labels.MatchEqual,
+				Name: astmapper.ShardLabel,
+				Value: astmapper.ShardAnnotation{
+					Shard: i,
+					Of:    tc.shards,
+				}.String(),
+			})
+
+			require.Nil(t, err)
+
+			for set.Next() {
+				seriesCt++
+				iter := set.At().Iterator()
+				samples := 0
+				for iter.Next() {
+					samples++
+				}
+				require.Equal(t, tc.nSamples, samples)
+			}
+
+		}
+		require.Equal(t, expectedSeries, seriesCt)
+	}
+}
diff --git a/pkg/querier/queryrange/value.go b/pkg/querier/queryrange/value.go
new file mode 100644
index 00000000000..23f519bff56
--- /dev/null
+++ b/pkg/querier/queryrange/value.go
@@ -0,0 +1,73 @@
+package queryrange
+
+import (
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+)
+
+// FromResult transforms a promql query result into a samplestream. A scalar
+// becomes one label-less stream with a single sample, a vector one single-sample
+// stream per element and a matrix one stream per series. A failed result returns
+// its error; a nil or unsupported (e.g. string) value returns a new error.
+func FromResult(res *promql.Result) ([]SampleStream, error) {
+	if res.Err != nil {
+		return nil, res.Err
+	}
+	switch v := res.Value.(type) {
+	case nil:
+		// a nil Value has no Type() to report; calling it below would panic
+		return nil, errors.New("Unexpected value type: [<nil>]")
+
+	case promql.Scalar:
+		sample := client.Sample{Value: v.V, TimestampMs: v.T}
+		return []SampleStream{{Samples: []client.Sample{sample}}}, nil
+
+	case promql.Vector:
+		// each vector element carries exactly one point
+		streams := make([]SampleStream, 0, len(v))
+		for _, sample := range v {
+			streams = append(streams, SampleStream{
+				Labels:  mapLabels(sample.Metric),
+				Samples: mapPoints(sample.Point),
+			})
+		}
+		return streams, nil
+
+	case promql.Matrix:
+		streams := make([]SampleStream, 0, len(v))
+		for _, series := range v {
+			streams = append(streams, SampleStream{
+				Labels:  mapLabels(series.Metric),
+				Samples: mapPoints(series.Points...),
+			})
+		}
+		return streams, nil
+	}
+
+	// any other value type (e.g. promql.String) is not representable here
+	return nil, errors.Errorf("Unexpected value type: [%s]", res.Value.Type())
+}
+
+// mapLabels converts prometheus labels into their client.LabelAdapter form.
+func mapLabels(ls labels.Labels) []client.LabelAdapter {
+	adapted := make([]client.LabelAdapter, len(ls))
+	for i := range ls {
+		adapted[i] = client.LabelAdapter(ls[i])
+	}
+	return adapted
+}
+
+// mapPoints converts promql points into client samples, carrying over each
+// point's value and timestamp unchanged.
+func mapPoints(pts ...promql.Point) []client.Sample {
+	samples := make([]client.Sample, len(pts))
+	for i, pt := range pts {
+		samples[i] = client.Sample{
+			Value:       pt.V,
+			TimestampMs: pt.T,
+		}
+	}
+	return samples
+}
diff --git a/pkg/querier/queryrange/value_test.go b/pkg/querier/queryrange/value_test.go
new file mode 100644
index 00000000000..524c2e83d90
--- /dev/null
+++ b/pkg/querier/queryrange/value_test.go
@@ -0,0 +1,167 @@
+package queryrange
+
+import (
+	"fmt"
+	"testing"
+
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/pkg/errors"
+	"github.com/prometheus/prometheus/pkg/labels"
+	"github.com/prometheus/prometheus/promql"
+	"github.com/stretchr/testify/require"
+)
+
+func TestFromValue(t *testing.T) {
+	var testExpr = []struct {
+		input    *promql.Result
+		err      bool
+		expected []SampleStream
+	}{
+		// string (errors)
+		{
+			input: &promql.Result{Value: promql.String{T: 1, V: "hi"}},
+			err:   true,
+		},
+		{
+			input: &promql.Result{Err: errors.New("foo")},
+			err:   true,
+		},
+		// Scalar
+		{
+			input: &promql.Result{Value: promql.Scalar{T: 1, V: 1}},
+			err:   false,
+			expected: []SampleStream{
+				{
+					Samples: []client.Sample{
+						{
+							Value:       1,
+							TimestampMs: 1,
+						},
+					},
+				},
+			},
+		},
+		// Vector
+		{
+			input: &promql.Result{
+				Value: promql.Vector{
+					promql.Sample{
+						Point: promql.Point{T: 1, V: 1},
+						Metric: labels.Labels{
+							{Name: "a", Value: "a1"},
+							{Name: "b", Value: "b1"},
+						},
+					},
+					promql.Sample{
+						Point: promql.Point{T: 2, V: 2},
+						Metric: labels.Labels{
+							{Name: "a", Value: "a2"},
+							{Name: "b", Value: "b2"},
+						},
+					},
+				},
+			},
+			err: false,
+			expected: []SampleStream{
+				{
+					Labels: []client.LabelAdapter{
+						{Name: "a", Value: "a1"},
+						{Name: "b", Value: "b1"},
+					},
+					Samples: []client.Sample{
+						{
+							Value:       1,
+							TimestampMs: 1,
+						},
+					},
+				},
+				{
+					Labels: []client.LabelAdapter{
+						{Name: "a", Value: "a2"},
+						{Name: "b", Value: "b2"},
+					},
+					Samples: []client.Sample{
+						{
+							Value:       2,
+							TimestampMs: 2,
+						},
+					},
+				},
+			},
+		},
+		// Matrix
+		{
+			input: &promql.Result{
+				Value: promql.Matrix{
+					{
+						Metric: labels.Labels{
+							{Name: "a", Value: "a1"},
+							{Name: "b", Value: "b1"},
+						},
+						Points: []promql.Point{
+							{T: 1, V: 1},
+							{T: 2, V: 2},
+						},
+					},
+					{
+						Metric: labels.Labels{
+							{Name: "a", Value: "a2"},
+							{Name: "b", Value: "b2"},
+						},
+						Points: []promql.Point{
+							{T: 1, V: 8},
+							{T: 2, V: 9},
+						},
+					},
+				},
+			},
+			err: false,
+			expected: []SampleStream{
+				{
+					Labels: []client.LabelAdapter{
+						{Name: "a", Value: "a1"},
+						{Name: "b", Value: "b1"},
+					},
+					Samples: []client.Sample{
+						{
+							Value:       1,
+							TimestampMs: 1,
+						},
+						{
+							Value:       2,
+							TimestampMs: 2,
+						},
+					},
+				},
+				{
+					Labels: []client.LabelAdapter{
+						{Name: "a", Value: "a2"},
+						{Name: "b", Value: "b2"},
+					},
+					Samples: []client.Sample{
+						{
+							Value:       8,
+							TimestampMs: 1,
+						},
+						{
+							Value:       9,
+							TimestampMs: 2,
+						},
+					},
+				},
+			},
+		},
+	}
+
+	for i, c := range testExpr {
+		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
+			result, err := FromResult(c.input)
+			if c.err {
+				require.NotNil(t, err)
+			} else {
+				require.Nil(t, err)
+				require.Equal(t, c.expected, result)
+			}
+		})
+	}
+}
diff --git a/pkg/querier/remote_read_test.go b/pkg/querier/remote_read_test.go
index 1b29f2bd592..9f4fea14439 100644
--- a/pkg/querier/remote_read_test.go
+++ b/pkg/querier/remote_read_test.go
@@ -9,6 +9,8 @@ import (
 	"net/http/httptest"
 	"testing"
 
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/gogo/protobuf/proto"
 	"github.com/golang/snappy"
 	"github.com/prometheus/common/model"
@@ -90,7 +92,7 @@ func (m mockQuerier) Select(sp *storage.SelectParams, matchers ...*labels.Matche
 	if sp == nil {
 		panic(fmt.Errorf("select params must be set"))
 	}
-	return matrixToSeriesSet(m.matrix), nil, nil
+	return series.MatrixToSeriesSet(m.matrix), nil, nil
 }
 
 func (m mockQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
diff --git a/pkg/querier/series_set.go b/pkg/querier/series/series_set.go
similarity index 64%
rename from pkg/querier/series_set.go
rename to pkg/querier/series/series_set.go
index 2b5c66d1908..4f11dde09ca 100644
--- a/pkg/querier/series_set.go
+++ b/pkg/querier/series/series_set.go
@@ -14,7 +14,7 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
-package querier
+package series
 
 import (
 	"sort"
@@ -26,61 +26,69 @@ import (
 	"github.com/cortexproject/cortex/pkg/prom1/storage/metric"
 )
 
-// concreteSeriesSet implements storage.SeriesSet.
-type concreteSeriesSet struct {
+// ConcreteSeriesSet implements storage.SeriesSet.
+type ConcreteSeriesSet struct {
 	cur    int
 	series []storage.Series
 }
 
-func newConcreteSeriesSet(series []storage.Series) storage.SeriesSet {
+// NewConcreteSeriesSet instantiates an in-memory series set from a list of series, sorted by labels
+func NewConcreteSeriesSet(series []storage.Series) storage.SeriesSet {
 	sort.Sort(byLabels(series))
-	return &concreteSeriesSet{
+	return &ConcreteSeriesSet{
 		cur:    -1,
 		series: series,
 	}
 }
 
-func (c *concreteSeriesSet) Next() bool {
+// Next iterates through a series set and impls storage.SeriesSet
+func (c *ConcreteSeriesSet) Next() bool {
 	c.cur++
 	return c.cur < len(c.series)
 }
 
-func (c *concreteSeriesSet) At() storage.Series {
+// At returns the current series and impls storage.SeriesSet
+func (c *ConcreteSeriesSet) At() storage.Series {
 	return c.series[c.cur]
 }
 
-func (c *concreteSeriesSet) Err() error {
+// Err impls storage.SeriesSet
+func (c *ConcreteSeriesSet) Err() error {
 	return nil
 }
 
-// concreteSeries implements storage.Series.
-type concreteSeries struct {
+// ConcreteSeries implements storage.Series.
+type ConcreteSeries struct {
 	labels  labels.Labels
 	samples []model.SamplePair
 }
 
-func newConcreteSeries(ls labels.Labels, samples []model.SamplePair) *concreteSeries {
-	return &concreteSeries{
+// NewConcreteSeries instantiates an in memory series from a list of samples & labels
+func NewConcreteSeries(ls labels.Labels, samples []model.SamplePair) *ConcreteSeries {
+	return &ConcreteSeries{
 		labels:  ls,
 		samples: samples,
 	}
 }
 
-func (c *concreteSeries) Labels() labels.Labels {
+// Labels impls storage.Series
+func (c *ConcreteSeries) Labels() labels.Labels {
 	return c.labels
 }
 
-func (c *concreteSeries) Iterator() storage.SeriesIterator {
-	return newConcreteSeriesIterator(c)
+// Iterator impls storage.Series
+func (c *ConcreteSeries) Iterator() storage.SeriesIterator {
+	return NewConcreteSeriesIterator(c)
 }
 
 // concreteSeriesIterator implements storage.SeriesIterator.
 type concreteSeriesIterator struct {
 	cur    int
-	series *concreteSeries
+	series *ConcreteSeries
 }
 
-func newConcreteSeriesIterator(series *concreteSeries) storage.SeriesIterator {
+// NewConcreteSeriesIterator instantiates an in-memory storage.SeriesIterator
+func NewConcreteSeriesIterator(series *ConcreteSeries) storage.SeriesIterator {
 	return &concreteSeriesIterator{
 		cur:    -1,
 		series: series,
@@ -108,6 +116,11 @@ func (c *concreteSeriesIterator) Err() error {
 	return nil
 }
 
+// NewErrIterator instantiates an errIterator
+func NewErrIterator(err error) storage.SeriesIterator {
+	return errIterator{err}
+}
+
 // errIterator implements storage.SeriesIterator, just returning an error.
 type errIterator struct {
 	err error
@@ -129,26 +142,28 @@ func (e errIterator) Err() error {
 	return e.err
 }
 
-func matrixToSeriesSet(m model.Matrix) storage.SeriesSet {
+// MatrixToSeriesSet creates a storage.SeriesSet from a model.Matrix
+func MatrixToSeriesSet(m model.Matrix) storage.SeriesSet {
 	series := make([]storage.Series, 0, len(m))
 	for _, ss := range m {
-		series = append(series, &concreteSeries{
+		series = append(series, &ConcreteSeries{
 			labels:  metricToLabels(ss.Metric),
 			samples: ss.Values,
 		})
 	}
-	return newConcreteSeriesSet(series)
+	return NewConcreteSeriesSet(series)
 }
 
-func metricsToSeriesSet(ms []metric.Metric) storage.SeriesSet {
+// MetricsToSeriesSet creates a storage.SeriesSet from a []metric.Metric
+func MetricsToSeriesSet(ms []metric.Metric) storage.SeriesSet {
 	series := make([]storage.Series, 0, len(ms))
 	for _, m := range ms {
-		series = append(series, &concreteSeries{
+		series = append(series, &ConcreteSeries{
 			labels:  metricToLabels(m.Metric),
 			samples: nil,
 		})
 	}
-	return newConcreteSeriesSet(series)
+	return NewConcreteSeriesSet(series)
 }
 
 func metricToLabels(m model.Metric) labels.Labels {
diff --git a/pkg/querier/series_set_test.go b/pkg/querier/series/series_set_test.go
similarity index 88%
rename from pkg/querier/series_set_test.go
rename to pkg/querier/series/series_set_test.go
index a1244b57f4d..a8ca1ae4efc 100644
--- a/pkg/querier/series_set_test.go
+++ b/pkg/querier/series/series_set_test.go
@@ -1,4 +1,4 @@
-package querier
+package series
 
 import (
 	"testing"
@@ -10,15 +10,15 @@ import (
 )
 
 func TestConcreteSeriesSet(t *testing.T) {
-	series1 := &concreteSeries{
+	series1 := &ConcreteSeries{
 		labels:  labels.FromStrings("foo", "bar"),
 		samples: []model.SamplePair{{Value: 1, Timestamp: 2}},
 	}
-	series2 := &concreteSeries{
+	series2 := &ConcreteSeries{
 		labels:  labels.FromStrings("foo", "baz"),
 		samples: []model.SamplePair{{Value: 3, Timestamp: 4}},
 	}
-	c := newConcreteSeriesSet([]storage.Series{series2, series1})
+	c := NewConcreteSeriesSet([]storage.Series{series2, series1})
 	require.True(t, c.Next())
 	require.Equal(t, series1, c.At())
 	require.True(t, c.Next())
@@ -39,7 +39,7 @@ func TestMatrixToSeriesSetSortsMetricLabels(t *testing.T) {
 			Values: []model.SamplePair{{Timestamp: 0, Value: 0}},
 		},
 	}
-	ss := matrixToSeriesSet(matrix)
+	ss := MatrixToSeriesSet(matrix)
 	require.True(t, ss.Next())
 	require.NoError(t, ss.Err())
 
diff --git a/pkg/querier/unified_querier.go b/pkg/querier/unified_querier.go
index 8211f04cc29..04815637e2f 100644
--- a/pkg/querier/unified_querier.go
+++ b/pkg/querier/unified_querier.go
@@ -9,9 +9,10 @@ import (
 	"github.com/weaveworks/common/user"
 
 	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 )
 
-func newUnifiedChunkQueryable(ds, cs ChunkStore, distributor Distributor, chunkIteratorFunc chunkIteratorFunc, cfg Config) storage.Queryable {
+func newUnifiedChunkQueryable(ds, cs chunkstore.ChunkStore, distributor Distributor, chunkIteratorFunc chunkIteratorFunc, cfg Config) storage.Queryable {
 	return storage.QueryableFunc(func(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
 		ucq := &unifiedChunkQuerier{
 			querier: querier{
@@ -44,7 +45,7 @@ func newUnifiedChunkQueryable(ds, cs ChunkStore, distributor Distributor, chunkI
 }
 
 type unifiedChunkQuerier struct {
-	stores []ChunkStore
+	stores []chunkstore.ChunkStore
 
 	// We reuse metadataQuery, LabelValues and Close from querier.
 	querier
@@ -57,7 +58,7 @@ func (q *unifiedChunkQuerier) Get(ctx context.Context, userID string, from, thro
 	css := make(chan []chunk.Chunk, len(q.stores))
 	errs := make(chan error, len(q.stores))
 	for _, store := range q.stores {
-		go func(store ChunkStore) {
+		go func(store chunkstore.ChunkStore) {
 			cs, err := store.Get(ctx, userID, from, through, matchers...)
 			if err != nil {
 				errs <- err
diff --git a/tools/query-audit/auditor.go b/tools/query-audit/auditor.go
new file mode 100644
index 00000000000..17ff61c3dbe
--- /dev/null
+++ b/tools/query-audit/auditor.go
@@ -0,0 +1,92 @@
+package main
+
+import (
+	"math"
+
+	"github.com/pkg/errors"
+	"github.com/prometheus/common/model"
+)
+
+// Auditor is a struct for auditing prometheus queries
+type Auditor struct{}
+
+// Diff stores a difference between two queries
+type Diff struct {
+	Series      int
+	Diff        float64   // avg proportional diff across all series & samples
+	sampleDiffs []float64 // proportional diffs as measured by x/control
+}
+
+// Audit compares the result x of a test query against control and reports how far x deviates.
+func (a *Auditor) Audit(control, x model.Value) (Diff, error) {
+	if x.Type() == model.ValMatrix && control.Type() == model.ValMatrix {
+		// The audit helpers take the control first: it is the baseline diffs are measured against.
+		return a.auditMatrix(control.(model.Matrix), x.(model.Matrix))
+	}
+	if x.Type() == model.ValVector && control.Type() == model.ValVector {
+		return a.auditVector(control.(model.Vector), x.(model.Vector))
+	}
+
+	return Diff{}, errors.Errorf("unsupported types for equality: got %s & %s", control.Type().String(), x.Type().String())
+}
+
+// auditMatrix compares two matrices series-by-series and sample-by-sample, treating x as the
+// control. It errors on any structural mismatch and otherwise averages |y-x|/|x| over all samples.
+func (a *Auditor) auditMatrix(x, y model.Matrix) (diff Diff, err error) {
+	// different # of returned series
+	if len(x) != len(y) {
+		return diff, errors.Errorf("different # of series: control=%d, other=%d", len(x), len(y))
+	}
+
+	for i := 0; i < len(x); i++ {
+		xSeries, ySeries := x[i], y[i]
+		if !xSeries.Metric.Equal(ySeries.Metric) {
+			return diff, errors.Errorf("mismatched metrics: %v vs %v", xSeries.Metric, ySeries.Metric)
+		}
+
+		xVals, yVals := xSeries.Values, ySeries.Values
+		if len(xVals) != len(yVals) {
+			return diff, errors.Errorf(
+				"mismatched number of samples for series %v. control=%d, other=%d",
+				xSeries.Metric,
+				len(xVals),
+				len(yVals),
+			)
+		}
+
+		for j := 0; j < len(xVals); j++ {
+			xSample, ySample := xVals[j], yVals[j]
+			if xSample.Timestamp != ySample.Timestamp {
+				return diff, errors.Errorf(
+					"mismatched timestamp for %d sample of series %v. control=%d, other=%d",
+					j,
+					xSeries.Metric,
+					xSample.Timestamp,
+					ySample.Timestamp,
+				)
+			}
+			absDiff := math.Abs(float64(ySample.Value-xSample.Value)) / math.Abs(float64(xSample.Value))
+			// 0/0 -> no diff
+			if math.IsNaN(absDiff) {
+				absDiff = 0
+			}
+			diff.sampleDiffs = append(diff.sampleDiffs, absDiff)
+		}
+	}
+
+	diff.Series = len(x)
+	// With no samples at all the average would be 0/0 (NaN); report no difference instead.
+	if len(diff.sampleDiffs) == 0 {
+		return diff, nil
+	}
+	var avgDiffProportion float64
+	for _, d := range diff.sampleDiffs {
+		avgDiffProportion += d
+	}
+	diff.Diff = avgDiffProportion / float64(len(diff.sampleDiffs))
+	return diff, nil
+}
+
+func (a *Auditor) auditVector(x, y model.Vector) (Diff, error) {
+	return Diff{}, errors.New("unimplemented")
+}
diff --git a/tools/query-audit/config.go b/tools/query-audit/config.go
new file mode 100644
index 00000000000..d1035fc1b49
--- /dev/null
+++ b/tools/query-audit/config.go
@@ -0,0 +1,67 @@
+package main
+
+import (
+	"io/ioutil"
+	"time"
+
+	"github.com/pkg/errors"
+
+	"sigs.k8s.io/yaml"
+)
+
+type Backend struct {
+	Host    string            `yaml:"host" json:"host"`
+	Headers map[string]string `yaml:"headers" json:"headers"`
+}
+
+type Query struct {
+	Query       string    `yaml:"query" json:"query"`
+	Start       time.Time `yaml:"start" json:"start"`
+	End         time.Time `yaml:"end" json:"end"`
+	StepSizeStr string    `yaml:"step_size" json:"step_size"`
+	StepSize    time.Duration
+}
+
+// Validate parses StepSizeStr into StepSize; an empty or zero step_size defaults to one minute.
+func (q *Query) Validate() error {
+	if q.StepSizeStr != "" { // time.ParseDuration rejects "", so only parse when set
+		var err error
+		if q.StepSize, err = time.ParseDuration(q.StepSizeStr); err != nil {
+			return err
+		}
+	}
+	if q.StepSize == time.Duration(0) {
+		q.StepSize = time.Minute
+	}
+	return nil
+}
+
+type Config struct {
+	Control Backend  `yaml:"control" json:"control"`
+	Test    Backend  `yaml:"test" json:"test"`
+	Queries []*Query `yaml:"queries" json:"queries"`
+}
+
+func (cfg *Config) Validate() error {
+	for _, q := range cfg.Queries {
+		if err := q.Validate(); err != nil {
+			return err
+		}
+	}
+	return nil
+}
+
+// LoadConfig reads the YAML-formatted config in filename into cfg and validates it.
+func LoadConfig(filename string, cfg *Config) error {
+	buf, err := ioutil.ReadFile(filename)
+	if err != nil {
+		return errors.Wrap(err, "Error reading config file")
+	}
+
+	err = yaml.Unmarshal(buf, cfg)
+	if err != nil {
+		return errors.Wrap(err, "Error parsing config file")
+	}
+
+	return cfg.Validate()
+}
diff --git a/tools/query-audit/example-config.yaml b/tools/query-audit/example-config.yaml
new file mode 100644
index 00000000000..11ffeeb7a5a
--- /dev/null
+++ b/tools/query-audit/example-config.yaml
@@ -0,0 +1,37 @@
+control:
+  host: http://localhost:8080/api/prom
+  headers:
+    "X-Scope-OrgID": 1234
+
+test:
+  host: http://localhost:8081/api/prom
+  headers:
+    "X-Scope-OrgID": 1234
+
+queries:
+  - query: 'sum(rate(container_cpu_usage_seconds_total[5m]))'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-28T00:00:00Z
+    step_size: 15m
+  - query: 'sum(rate(container_cpu_usage_seconds_total[5m])) by (container_name)'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-28T00:00:00Z
+    step_size: 15m
+  - query: 'sum(rate(container_cpu_usage_seconds_total[5m])) without (container_name)'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-26T00:00:00Z
+    step_size: 15m
+  - query: 'histogram_quantile(0.9, sum(rate(cortex_cache_value_size_bytes_bucket[5m])) by (le, job))'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-25T06:00:00Z
+    step_size: 15m
+    # two shardable legs
+  - query: 'sum without (instance, job) (rate(cortex_query_frontend_queue_length[5m])) or sum by (job) (rate(cortex_query_frontend_queue_length[5m]))'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-25T06:00:00Z
+    step_size: 15m
+    # one shardable leg
+  - query: 'sum without (instance, job) (rate(cortex_cache_request_duration_seconds_count[5m])) or rate(cortex_cache_request_duration_seconds_count[5m])'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-25T06:00:00Z
+    step_size: 15m
diff --git a/tools/query-audit/main.go b/tools/query-audit/main.go
new file mode 100644
index 00000000000..20b41380e09
--- /dev/null
+++ b/tools/query-audit/main.go
@@ -0,0 +1,87 @@
+package main
+
+import (
+	"context"
+	"flag"
+	"fmt"
+	"log"
+
+	v1 "github.com/prometheus/client_golang/api/prometheus/v1"
+)
+
+var (
+	configFile string
+)
+
+func init() {
+	flag.StringVar(&configFile, "f", "", "path to config file")
+	flag.Parse()
+	if configFile == "" {
+		log.Fatal(`unset configFile. try "-f <file>"`)
+	}
+}
+
+func main() {
+	var conf Config
+	if err := LoadConfig(configFile, &conf); err != nil {
+		log.Fatal(err)
+	}
+
+	err := Run(conf)
+	if err != nil {
+		log.Fatal(err)
+	}
+}
+
+// Run executes every configured query against the control and test backends and prints the
+// average proportional difference per query. It stops at the first query or audit error.
+func Run(conf Config) error {
+	ctlAPI, err := NewAPI(conf.Control)
+	if err != nil {
+		return err
+	}
+
+	tstAPI, err := NewAPI(conf.Test)
+	if err != nil {
+		return err
+	}
+
+	auditor := &Auditor{} // stateless, so one instance serves every query
+	for _, query := range conf.Queries {
+		// Both backends must be queried over exactly the same range and step.
+		rng := v1.Range{
+			Start: query.Start,
+			End:   query.End,
+			Step:  query.StepSize,
+		}
+
+		ctlResp, _, err := ctlAPI.QueryRange(context.Background(), query.Query, rng)
+		if err != nil {
+			return err
+		}
+
+		tstResp, _, err := tstAPI.QueryRange(context.Background(), query.Query, rng)
+		if err != nil {
+			return err
+		}
+
+		diff, err := auditor.Audit(ctlResp, tstResp)
+		if err != nil {
+			return err
+		}
+
+		// Diff is a proportion; scale it to a percentage for display.
+		fmt.Printf(
+			"\n%f%% avg diff for:\n\tquery: %s\n\tseries: %d\n\tsamples: %d\n\tstart: %v\n\tend: %v\n\tstep: %v\n",
+			diff.Diff*100,
+			query.Query,
+			diff.Series,
+			len(diff.sampleDiffs),
+			query.Start,
+			query.End,
+			query.StepSize,
+		)
+	}
+
+	return nil
+}
diff --git a/tools/query-audit/runner.go b/tools/query-audit/runner.go
new file mode 100644
index 00000000000..e8eadee852d
--- /dev/null
+++ b/tools/query-audit/runner.go
@@ -0,0 +1,32 @@
+package main
+
+import (
+	"net/http"
+
+	"github.com/prometheus/client_golang/api"
+	v1 "github.com/prometheus/client_golang/api/prometheus/v1"
+	"github.com/prometheus/client_golang/prometheus/promhttp"
+)
+
+// NewAPI instantiates a prometheus api
+func NewAPI(backend Backend) (v1.API, error) {
+	config := api.Config{
+		Address: backend.Host,
+	}
+
+	if len(backend.Headers) > 0 {
+		config.RoundTripper = promhttp.RoundTripperFunc(func(req *http.Request) (*http.Response, error) {
+			for key, value := range backend.Headers {
+				req.Header.Add(key, value)
+			}
+			return http.DefaultTransport.RoundTrip(req)
+		})
+	}
+
+	c, err := api.NewClient(config)
+	if err != nil {
+		return nil, err
+	}
+
+	return v1.NewAPI(c), nil
+}

From 5fb7c29198baf970805d7a36b480641a81c2a059 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Fri, 24 Jan 2020 10:51:16 -0500
Subject: [PATCH 02/25] addresses pr comments

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/chunk/storage/caching_index_client.go    |  3 -
 pkg/querier/queryrange/querysharding.go      | 66 ++++++++++----------
 pkg/querier/queryrange/querysharding_test.go |  4 +-
 pkg/querier/queryrange/roundtrip.go          |  5 ++
 4 files changed, 38 insertions(+), 40 deletions(-)

diff --git a/pkg/chunk/storage/caching_index_client.go b/pkg/chunk/storage/caching_index_client.go
index ab74f521784..f1863653b79 100644
--- a/pkg/chunk/storage/caching_index_client.go
+++ b/pkg/chunk/storage/caching_index_client.go
@@ -66,9 +66,6 @@ func (s *cachingIndexClient) Stop() {
 }
 
 func (s *cachingIndexClient) QueryPages(ctx context.Context, queries []chunk.IndexQuery, callback func(chunk.IndexQuery, chunk.ReadBatch) (shouldContinue bool)) error {
-	log, ctx := spanlogger.New(ctx, "cachingIndexClient.QueryPages")
-	defer log.Finish()
-
 	// We cache the entire row, so filter client side.
 	callback = chunk_util.QueryFilter(callback)
 
diff --git a/pkg/querier/queryrange/querysharding.go b/pkg/querier/queryrange/querysharding.go
index 37db16b8a63..d470e6beec9 100644
--- a/pkg/querier/queryrange/querysharding.go
+++ b/pkg/querier/queryrange/querysharding.go
@@ -43,6 +43,23 @@ func (confs ShardingConfigs) ValidRange(start, end int64) (chunk.PeriodConfig, e
 	return chunk.PeriodConfig{}, errInvalidShardingRange
 }
 
+// GetConf will extract a shardable config corresponding to a request and the shardingconfigs
+func (confs ShardingConfigs) GetConf(r Request) (chunk.PeriodConfig, error) {
+	conf, err := confs.ValidRange(r.GetStart(), r.GetEnd())
+
+	// query exists across multiple sharding configs
+	if err != nil {
+		return conf, err
+	}
+
+	// query doesn't have shard factor, so don't try to do AST mapping.
+	if conf.RowShards < 2 {
+		return conf, errors.Errorf("shard factor not high enough: [%d]", conf.RowShards)
+	}
+
+	return conf, nil
+}
+
 func (confs ShardingConfigs) hasShards() bool {
 	for _, conf := range confs {
 		if conf.RowShards > 0 {
@@ -68,9 +85,6 @@ func NewQueryShardMiddleware(
 	codec Codec,
 	minShardingLookback time.Duration,
 ) Middleware {
-	passthrough := MiddlewareFunc(func(next Handler) Handler {
-		return next
-	})
 
 	noshards := !confs.hasShards()
 
@@ -80,38 +94,22 @@ func NewQueryShardMiddleware(
 			"msg", "no configuration with shard found",
 			"confs", fmt.Sprintf("%+v", confs),
 		)
-		return passthrough
-	}
-
-	getConf := func(r Request) (chunk.PeriodConfig, error) {
-		conf, err := confs.ValidRange(r.GetStart(), r.GetEnd())
-
-		// query exists across multiple sharding configs
-		if err != nil {
-			return conf, err
-		}
-
-		// query doesn't have shard factor, so don't try to do AST mapping.
-		if conf.RowShards < 2 {
-			return conf, errors.Errorf("shard factor not high enough: [%d]", conf.RowShards)
-		}
-
-		return conf, nil
+		return PassthroughMiddleware
 	}
 
 	mapperware := MiddlewareFunc(func(next Handler) Handler {
 		return &astMapperware{
-			getConf: getConf,
-			logger:  log.With(logger, "middleware", "QueryShard.astMapperware"),
-			next:    next,
+			confs:  confs,
+			logger: log.With(logger, "middleware", "QueryShard.astMapperware"),
+			next:   next,
 		}
 	})
 
 	shardingware := MiddlewareFunc(func(next Handler) Handler {
 		return &queryShard{
-			getConf: getConf,
-			next:    next,
-			engine:  engine,
+			confs:  confs,
+			next:   next,
+			engine: engine,
 		}
 	})
 
@@ -132,13 +130,13 @@ func NewQueryShardMiddleware(
 }
 
 type astMapperware struct {
-	getConf func(Request) (chunk.PeriodConfig, error)
-	logger  log.Logger
-	next    Handler
+	confs  ShardingConfigs
+	logger log.Logger
+	next   Handler
 }
 
 func (ast *astMapperware) Do(ctx context.Context, r Request) (Response, error) {
-	conf, err := ast.getConf(r)
+	conf, err := ast.confs.GetConf(r)
 	// cannot shard with this timerange
 	if err != nil {
 		level.Warn(ast.logger).Log("err", err.Error())
@@ -176,15 +174,15 @@ func (ast *astMapperware) Do(ctx context.Context, r Request) (Response, error) {
 }
 
 type queryShard struct {
-	getConf func(Request) (chunk.PeriodConfig, error)
-	next    Handler
-	engine  *promql.Engine
+	confs  ShardingConfigs
+	next   Handler
+	engine *promql.Engine
 }
 
 func (qs *queryShard) Do(ctx context.Context, r Request) (Response, error) {
 	// since there's no available sharding configuration for this time range,
 	// no astmapping has been performed, so skip this middleware.
-	if _, err := qs.getConf(r); err != nil {
+	if _, err := qs.confs.GetConf(r); err != nil {
 		return qs.next.Do(ctx, r)
 	}
 
diff --git a/pkg/querier/queryrange/querysharding_test.go b/pkg/querier/queryrange/querysharding_test.go
index 90d2b176c10..4094a457432 100644
--- a/pkg/querier/queryrange/querysharding_test.go
+++ b/pkg/querier/queryrange/querysharding_test.go
@@ -405,9 +405,7 @@ func TestQueryshardingCorrectness(t *testing.T) {
 
 			mapperware := MiddlewareFunc(func(next Handler) Handler {
 				return &astMapperware{
-					getConf: func(_ Request) (chunk.PeriodConfig, error) {
-						return shardingConf[0], nil
-					},
+					confs:  shardingConf,
 					logger: log.NewNopLogger(),
 					next:   next,
 				}
diff --git a/pkg/querier/queryrange/roundtrip.go b/pkg/querier/queryrange/roundtrip.go
index d55db7893fc..eba73d8ac30 100644
--- a/pkg/querier/queryrange/roundtrip.go
+++ b/pkg/querier/queryrange/roundtrip.go
@@ -36,6 +36,11 @@ import (
 
 const day = 24 * time.Hour
 
+// PassthroughMiddleware is a noop middleware
+var PassthroughMiddleware = MiddlewareFunc(func(next Handler) Handler {
+	return next
+})
+
 // Config for query_range middleware chain.
 type Config struct {
 	SplitQueriesByInterval time.Duration `yaml:"split_queries_by_interval"`

From afdd99dc5affca9a571518b2ce794b925676b7ec Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Tue, 28 Jan 2020 09:30:53 -0500
Subject: [PATCH 03/25] instruments frontend sharding, splitby

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/astmapper/instrumentation.go    | 12 ++++++++++
 pkg/querier/astmapper/shard_summer.go       |  2 ++
 pkg/querier/queryrange/instrumentation.go   | 26 ++++++++++++++++-----
 pkg/querier/queryrange/querysharding.go     |  1 +
 pkg/querier/queryrange/split_by_interval.go |  1 +
 5 files changed, 36 insertions(+), 6 deletions(-)
 create mode 100644 pkg/querier/astmapper/instrumentation.go

diff --git a/pkg/querier/astmapper/instrumentation.go b/pkg/querier/astmapper/instrumentation.go
new file mode 100644
index 00000000000..39af54e5686
--- /dev/null
+++ b/pkg/querier/astmapper/instrumentation.go
@@ -0,0 +1,12 @@
+package astmapper
+
+import (
+	"github.com/prometheus/client_golang/prometheus"
+	"github.com/prometheus/client_golang/prometheus/promauto"
+)
+
+var shardCounter = promauto.NewCounter(prometheus.CounterOpts{
+	Namespace: "cortex",
+	Name:      "frontend_sharded_queries_total",
+	Help:      "Total number of sharded queries",
+})
diff --git a/pkg/querier/astmapper/shard_summer.go b/pkg/querier/astmapper/shard_summer.go
index 4face8feb16..1a6b7d331f6 100644
--- a/pkg/querier/astmapper/shard_summer.go
+++ b/pkg/querier/astmapper/shard_summer.go
@@ -198,6 +198,8 @@ func (summer *shardSummer) splitSum(
 		)
 	}
 
+	shardCounter.Add(float64(summer.shards))
+
 	return parent, children, nil
 }
 
diff --git a/pkg/querier/queryrange/instrumentation.go b/pkg/querier/queryrange/instrumentation.go
index c55a1b1071e..b73685d93c3 100644
--- a/pkg/querier/queryrange/instrumentation.go
+++ b/pkg/querier/queryrange/instrumentation.go
@@ -8,12 +8,26 @@ import (
 	"github.com/weaveworks/common/instrument"
 )
 
-var queryRangeDuration = promauto.NewHistogramVec(prometheus.HistogramOpts{
-	Namespace: "cortex",
-	Name:      "frontend_query_range_duration_seconds",
-	Help:      "Total time spent in seconds doing query range requests.",
-	Buckets:   prometheus.DefBuckets,
-}, []string{"method", "status_code"})
+var (
+	queryRangeDuration = promauto.NewHistogramVec(prometheus.HistogramOpts{
+		Namespace: "cortex",
+		Name:      "frontend_query_range_duration_seconds",
+		Help:      "Total time spent in seconds doing query range requests.",
+		Buckets:   prometheus.DefBuckets,
+	}, []string{"method", "status_code"})
+
+	mappedASTCounter = promauto.NewCounter(prometheus.CounterOpts{
+		Namespace: "cortex",
+		Name:      "frontend_mapped_asts_total",
+		Help:      "Total number of queries that have undergone AST mapping",
+	})
+
+	splitByCounter = promauto.NewCounter(prometheus.CounterOpts{
+		Namespace: "cortex",
+		Name:      "frontend_split_queries_total",
+		Help:      "Total number of split (parallelized) request segments",
+	})
+)
 
 // InstrumentMiddleware can be inserted into the middleware chain to expose timing information.
 func InstrumentMiddleware(name string) Middleware {
diff --git a/pkg/querier/queryrange/querysharding.go b/pkg/querier/queryrange/querysharding.go
index d470e6beec9..daa5979c51d 100644
--- a/pkg/querier/queryrange/querysharding.go
+++ b/pkg/querier/queryrange/querysharding.go
@@ -168,6 +168,7 @@ func (ast *astMapperware) Do(ctx context.Context, r Request) (Response, error) {
 
 	strMappedQuery := mappedQuery.String()
 	level.Debug(ast.logger).Log("msg", "mapped query", "original", strQuery, "mapped", strMappedQuery)
+	mappedASTCounter.Inc()
 
 	return ast.next.Do(ctx, r.WithQuery(strMappedQuery))
 
diff --git a/pkg/querier/queryrange/split_by_interval.go b/pkg/querier/queryrange/split_by_interval.go
index ff5cd3af174..2dc55d428cb 100644
--- a/pkg/querier/queryrange/split_by_interval.go
+++ b/pkg/querier/queryrange/split_by_interval.go
@@ -28,6 +28,7 @@ func (s splitByInterval) Do(ctx context.Context, r Request) (Response, error) {
 	// First we're going to build new requests, one for each day, taking care
 	// to line up the boundaries with step.
 	reqs := splitQuery(r, s.interval)
+	splitByCounter.Add(float64(len(reqs)))
 
 	reqResps, err := DoRequests(ctx, s.next, reqs, s.limits)
 	if err != nil {

From 6bf5f209338038dc1c783dfa550a1d744d11b4f4 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Tue, 28 Jan 2020 10:02:48 -0500
Subject: [PATCH 04/25] LabelsSeriesID unexported again

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/chunk/schema.go           | 12 ++++++------
 pkg/chunk/schema_util.go      |  3 +--
 pkg/chunk/schema_util_test.go |  2 +-
 3 files changed, 8 insertions(+), 9 deletions(-)

diff --git a/pkg/chunk/schema.go b/pkg/chunk/schema.go
index 3ef4506a7d1..bac1830bee4 100644
--- a/pkg/chunk/schema.go
+++ b/pkg/chunk/schema.go
@@ -121,7 +121,7 @@ func (s schema) GetCacheKeysAndLabelWriteEntries(from, through model.Time, userI
 		key := strings.Join([]string{
 			bucket.tableName,
 			bucket.hashKey,
-			string(LabelsSeriesID(labels)),
+			string(labelsSeriesID(labels)),
 		},
 			"-",
 		)
@@ -611,7 +611,7 @@ func (v9Entries) GetWriteEntries(bucket Bucket, metricName string, labels labels
 }
 
 func (v9Entries) GetLabelWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := LabelsSeriesID(labels)
+	seriesID := labelsSeriesID(labels)
 
 	entries := []IndexEntry{
 		// Entry for metricName -> seriesID
@@ -641,7 +641,7 @@ func (v9Entries) GetLabelWriteEntries(bucket Bucket, metricName string, labels l
 }
 
 func (v9Entries) GetChunkWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := LabelsSeriesID(labels)
+	seriesID := labelsSeriesID(labels)
 	encodedThroughBytes := encodeTime(bucket.through)
 
 	entries := []IndexEntry{
@@ -711,7 +711,7 @@ func (v10Entries) GetWriteEntries(bucket Bucket, metricName string, labels label
 }
 
 func (s v10Entries) GetLabelWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := LabelsSeriesID(labels)
+	seriesID := labelsSeriesID(labels)
 
 	// read first 32 bits of the hash and use this to calculate the shard
 	shard := binary.BigEndian.Uint32(seriesID) % s.rowShards
@@ -744,7 +744,7 @@ func (s v10Entries) GetLabelWriteEntries(bucket Bucket, metricName string, label
 }
 
 func (v10Entries) GetChunkWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := LabelsSeriesID(labels)
+	seriesID := labelsSeriesID(labels)
 	encodedThroughBytes := encodeTime(bucket.through)
 
 	entries := []IndexEntry{
@@ -832,7 +832,7 @@ type v11Entries struct {
 }
 
 func (s v11Entries) GetLabelWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
-	seriesID := LabelsSeriesID(labels)
+	seriesID := labelsSeriesID(labels)
 
 	// read first 32 bits of the hash and use this to calculate the shard
 	shard := binary.BigEndian.Uint32(seriesID) % s.rowShards
diff --git a/pkg/chunk/schema_util.go b/pkg/chunk/schema_util.go
index 3112da100f6..0906288e93f 100644
--- a/pkg/chunk/schema_util.go
+++ b/pkg/chunk/schema_util.go
@@ -47,8 +47,7 @@ func labelsString(ls labels.Labels) string {
 	return b.String()
 }
 
-// LabelsSeriesID hashes a label set
-func LabelsSeriesID(ls labels.Labels) []byte {
+func labelsSeriesID(ls labels.Labels) []byte {
 	h := sha256.Sum256([]byte(labelsString(ls)))
 	return encodeBase64Bytes(h[:])
 }
diff --git a/pkg/chunk/schema_util_test.go b/pkg/chunk/schema_util_test.go
index 3de4b75423b..3e5eb95a3d4 100644
--- a/pkg/chunk/schema_util_test.go
+++ b/pkg/chunk/schema_util_test.go
@@ -38,7 +38,7 @@ func TestLabelSeriesID(t *testing.T) {
 			"RBNvo1WzZ4oRRq0W9+hknpT7T8If536DEMBg9hyq/4o",
 		},
 	} {
-		seriesID := string(LabelsSeriesID(c.lbls))
+		seriesID := string(labelsSeriesID(c.lbls))
 		assert.Equal(t, c.expected, seriesID, labelsString(c.lbls))
 	}
 }

From 3e280143cd3db09224a4ab7a9c969680163cb1d5 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Tue, 28 Jan 2020 10:08:50 -0500
Subject: [PATCH 05/25] removes unnecessary codec interface in astmapping

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/ingester/ingester.go                     |  1 -
 pkg/querier/astmapper/embedded.go            | 18 ++++--------------
 pkg/querier/astmapper/subtree_folder.go      | 17 +++++------------
 pkg/querier/astmapper/subtree_folder_test.go |  2 +-
 4 files changed, 10 insertions(+), 28 deletions(-)

diff --git a/pkg/ingester/ingester.go b/pkg/ingester/ingester.go
index 3f6d586ff69..27eac4652d3 100644
--- a/pkg/ingester/ingester.go
+++ b/pkg/ingester/ingester.go
@@ -436,7 +436,6 @@ func (i *Ingester) Query(ctx context.Context, req *client.QueryRequest) (*client
 	result := &client.QueryResponse{}
 	numSeries, numSamples := 0, 0
 	maxSamplesPerQuery := i.limits.MaxSamplesPerQuery(userID)
-
 	err = state.forSeriesMatching(ctx, matchers, func(ctx context.Context, _ model.Fingerprint, series *memorySeries) error {
 		values, err := series.samplesForRange(from, through)
 		if err != nil {
diff --git a/pkg/querier/astmapper/embedded.go b/pkg/querier/astmapper/embedded.go
index c8adec0b4e6..ac8aeaa73f1 100644
--- a/pkg/querier/astmapper/embedded.go
+++ b/pkg/querier/astmapper/embedded.go
@@ -4,7 +4,6 @@ import (
 	"encoding/json"
 	"time"
 
-	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/promql"
 )
@@ -33,7 +32,7 @@ type EmbeddedQueries struct {
 }
 
 // JSONCodec is a Codec impl that uses JSON representations of EmbeddedQueries structs
-var JSONCodec Codec = jsonCodec{}
+var JSONCodec jsonCodec
 
 type jsonCodec struct{}
 
@@ -60,17 +59,8 @@ func (c jsonCodec) Decode(encoded string) (queries []string, err error) {
 	return embedded.Concat, nil
 }
 
-// A Codec is responsible for encoding/decoding queries
-type Codec interface {
-	Encode([]string) string
-	Decode(string) ([]string, error)
-}
-
 // Squash reduces an AST into a single vector or matrix query which can be hijacked by a Queryable impl.
-func Squash(codec Codec, isMatrix bool, nodes ...promql.Node) (promql.Expr, error) {
-	if codec == nil {
-		return nil, errors.Errorf("nil Codec")
-	}
+func Squash(isMatrix bool, nodes ...promql.Node) (promql.Expr, error) {
 
 	// concat OR legs
 	strs := make([]string, 0, len(nodes))
@@ -78,7 +68,7 @@ func Squash(codec Codec, isMatrix bool, nodes ...promql.Node) (promql.Expr, erro
 		strs = append(strs, node.String())
 	}
 
-	encoded := codec.Encode(strs)
+	encoded := JSONCodec.Encode(strs)
 
 	embeddedQuery, err := labels.NewMatcher(labels.MatchEqual, QueryLabel, encoded)
 
@@ -103,7 +93,7 @@ func Squash(codec Codec, isMatrix bool, nodes ...promql.Node) (promql.Expr, erro
 // VectorSquasher always uses a VectorSelector as the substitution node.
 // This is important because logical/set binops can only be applied against vectors and not matrices.
 func VectorSquasher(nodes ...promql.Node) (promql.Expr, error) {
-	return Squash(JSONCodec, false, nodes...)
+	return Squash(false, nodes...)
 }
 
 // OrSquasher is a custom squasher which mimics the intuitive but less efficient OR'ing of sharded vectors.
diff --git a/pkg/querier/astmapper/subtree_folder.go b/pkg/querier/astmapper/subtree_folder.go
index 3f206cdd331..92da5d8a502 100644
--- a/pkg/querier/astmapper/subtree_folder.go
+++ b/pkg/querier/astmapper/subtree_folder.go
@@ -1,7 +1,6 @@
 package astmapper
 
 import (
-	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/promql"
 )
 
@@ -11,18 +10,12 @@ if it does not contain any previously embedded queries. This allows the frontend
 subtrees of an AST that have not already been parallelized.
 
 */
-type subtreeFolder struct {
-	codec Codec
-}
+type subtreeFolder struct{}
 
-// NewSubtreeFolder creates a subtreeFolder with a specified codec
-func NewSubtreeFolder(codec Codec) (ASTMapper, error) {
-	if codec == nil {
-		return nil, errors.New("nil codec")
-	}
-	return NewASTNodeMapper(&subtreeFolder{
-		codec: JSONCodec,
-	}), nil
+// NewSubtreeFolder creates a subtreeFolder which can reduce an AST
+// to one embedded query if it contains no embedded queries yet
+func NewSubtreeFolder() (ASTMapper, error) {
+	return NewASTNodeMapper(&subtreeFolder{}), nil
 }
 
 // MapNode impls NodeMapper
diff --git a/pkg/querier/astmapper/subtree_folder_test.go b/pkg/querier/astmapper/subtree_folder_test.go
index 0a22619d34c..f81fd1b5d2a 100644
--- a/pkg/querier/astmapper/subtree_folder_test.go
+++ b/pkg/querier/astmapper/subtree_folder_test.go
@@ -96,7 +96,7 @@ func TestSubtreeMapper(t *testing.T) {
 		},
 	} {
 		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
-			mapper, err := NewSubtreeFolder(JSONCodec)
+			mapper, err := NewSubtreeFolder()
 			require.Nil(t, err)
 
 			expr, err := promql.ParseExpr(tc.input)

From 5aa58bc64f72949b0c4c1f0d687c0f1327c6ae97 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Tue, 28 Jan 2020 10:18:56 -0500
Subject: [PATCH 06/25] simplifies VectorSquasher as we never use matrices

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/astmapper/embedded.go | 20 ++++----------------
 1 file changed, 4 insertions(+), 16 deletions(-)

diff --git a/pkg/querier/astmapper/embedded.go b/pkg/querier/astmapper/embedded.go
index ac8aeaa73f1..de2f2f518e4 100644
--- a/pkg/querier/astmapper/embedded.go
+++ b/pkg/querier/astmapper/embedded.go
@@ -2,7 +2,6 @@ package astmapper
 
 import (
 	"encoding/json"
-	"time"
 
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/promql"
@@ -59,8 +58,10 @@ func (c jsonCodec) Decode(encoded string) (queries []string, err error) {
 	return embedded.Concat, nil
 }
 
-// Squash reduces an AST into a single vector or matrix query which can be hijacked by a Queryable impl.
-func Squash(isMatrix bool, nodes ...promql.Node) (promql.Expr, error) {
+// VectorSquasher reduces an AST into a single vector query which can be hijacked by a Queryable impl.
+// It always uses a VectorSelector as the substitution node.
+// This is important because logical/set binops can only be applied against vectors and not matrices.
+func VectorSquasher(nodes ...promql.Node) (promql.Expr, error) {
 
 	// concat OR legs
 	strs := make([]string, 0, len(nodes))
@@ -76,24 +77,11 @@ func Squash(isMatrix bool, nodes ...promql.Node) (promql.Expr, error) {
 		return nil, err
 	}
 
-	if isMatrix {
-		return &promql.MatrixSelector{
-			Name:          EmbeddedQueryFlag,
-			Range:         time.Minute,
-			LabelMatchers: []*labels.Matcher{embeddedQuery},
-		}, nil
-	}
-
 	return &promql.VectorSelector{
 		Name:          EmbeddedQueryFlag,
 		LabelMatchers: []*labels.Matcher{embeddedQuery},
 	}, nil
-}
 
-// VectorSquasher always uses a VectorSelector as the substitution node.
-// This is important because logical/set binops can only be applied against vectors and not matrices.
-func VectorSquasher(nodes ...promql.Node) (promql.Expr, error) {
-	return Squash(false, nodes...)
 }
 
 // OrSquasher is a custom squasher which mimics the intuitive but less efficient OR'ing of sharded vectors.

From 26e488beb89d5d3fa76cd25b6ce3ae0b3e3c0ebc Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Tue, 28 Jan 2020 10:20:36 -0500
Subject: [PATCH 07/25] combines queryrange series & value files

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/queryrange/series.go | 55 --------------------------------
 pkg/querier/queryrange/value.go  | 48 ++++++++++++++++++++++++++++
 2 files changed, 48 insertions(+), 55 deletions(-)
 delete mode 100644 pkg/querier/queryrange/series.go

diff --git a/pkg/querier/queryrange/series.go b/pkg/querier/queryrange/series.go
deleted file mode 100644
index 85a7b135531..00000000000
--- a/pkg/querier/queryrange/series.go
+++ /dev/null
@@ -1,55 +0,0 @@
-package queryrange
-
-import (
-	"github.com/cortexproject/cortex/pkg/querier/series"
-	"github.com/pkg/errors"
-	"github.com/prometheus/common/model"
-	"github.com/prometheus/prometheus/pkg/labels"
-	"github.com/prometheus/prometheus/promql"
-	"github.com/prometheus/prometheus/storage"
-)
-
-// ResponseToSamples is needed to map back from api response to the underlying series data
-func ResponseToSamples(resp Response) ([]SampleStream, error) {
-	promRes, ok := resp.(*PrometheusResponse)
-	if !ok {
-		return nil, errors.Errorf("error invalid response type: %T, expected: %T", resp, &PrometheusResponse{})
-	}
-	if promRes.Error != "" {
-		return nil, errors.New(promRes.Error)
-	}
-	switch promRes.Data.ResultType {
-	case promql.ValueTypeVector, promql.ValueTypeMatrix:
-		return promRes.Data.Result, nil
-	}
-
-	return nil, errors.Errorf(
-		"Invalid promql.Value type: [%s]. Only %s and %s supported",
-		promRes.Data.ResultType,
-		promql.ValueTypeVector,
-		promql.ValueTypeMatrix,
-	)
-}
-
-// NewSeriesSet returns an in memory storage.SeriesSet from a []SampleStream
-func NewSeriesSet(results []SampleStream) storage.SeriesSet {
-
-	set := make([]storage.Series, 0, len(results))
-
-	for _, stream := range results {
-		samples := make([]model.SamplePair, 0, len(stream.Samples))
-		for _, sample := range stream.Samples {
-			samples = append(samples, model.SamplePair{
-				Timestamp: model.Time(sample.TimestampMs),
-				Value:     model.SampleValue(sample.Value),
-			})
-		}
-
-		ls := make([]labels.Label, 0, len(stream.Labels))
-		for _, l := range stream.Labels {
-			ls = append(ls, labels.Label(l))
-		}
-		set = append(set, series.NewConcreteSeries(ls, samples))
-	}
-	return series.NewConcreteSeriesSet(set)
-}
diff --git a/pkg/querier/queryrange/value.go b/pkg/querier/queryrange/value.go
index 23f519bff56..c5804637017 100644
--- a/pkg/querier/queryrange/value.go
+++ b/pkg/querier/queryrange/value.go
@@ -2,9 +2,12 @@ package queryrange
 
 import (
 	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/pkg/errors"
+	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/promql"
+	"github.com/prometheus/prometheus/storage"
 )
 
 // FromResult transforms a promql query result into a samplestream
@@ -71,3 +74,48 @@ func mapPoints(pts ...promql.Point) []client.Sample {
 
 	return result
 }
+
+// ResponseToSamples is needed to map back from api response to the underlying series data
+func ResponseToSamples(resp Response) ([]SampleStream, error) {
+	promRes, ok := resp.(*PrometheusResponse)
+	if !ok {
+		return nil, errors.Errorf("error invalid response type: %T, expected: %T", resp, &PrometheusResponse{})
+	}
+	if promRes.Error != "" {
+		return nil, errors.New(promRes.Error)
+	}
+	switch promRes.Data.ResultType {
+	case promql.ValueTypeVector, promql.ValueTypeMatrix:
+		return promRes.Data.Result, nil
+	}
+
+	return nil, errors.Errorf(
+		"Invalid promql.Value type: [%s]. Only %s and %s supported",
+		promRes.Data.ResultType,
+		promql.ValueTypeVector,
+		promql.ValueTypeMatrix,
+	)
+}
+
+// NewSeriesSet returns an in memory storage.SeriesSet from a []SampleStream
+func NewSeriesSet(results []SampleStream) storage.SeriesSet {
+
+	set := make([]storage.Series, 0, len(results))
+
+	for _, stream := range results {
+		samples := make([]model.SamplePair, 0, len(stream.Samples))
+		for _, sample := range stream.Samples {
+			samples = append(samples, model.SamplePair{
+				Timestamp: model.Time(sample.TimestampMs),
+				Value:     model.SampleValue(sample.Value),
+			})
+		}
+
+		ls := make([]labels.Label, 0, len(stream.Labels))
+		for _, l := range stream.Labels {
+			ls = append(ls, labels.Label(l))
+		}
+		set = append(set, series.NewConcreteSeries(ls, samples))
+	}
+	return series.NewConcreteSeriesSet(set)
+}

From ba07d5bb76e2ce48f1e0c08f55f7981341b709be Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Tue, 28 Jan 2020 10:35:20 -0500
Subject: [PATCH 08/25] removes noops struct embedding strategy in schema,
 provides noop impls on all schemas instead

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/chunk/schema.go | 47 ++++++++++++++++++++++++---------------------
 1 file changed, 25 insertions(+), 22 deletions(-)

diff --git a/pkg/chunk/schema.go b/pkg/chunk/schema.go
index bac1830bee4..a9014efb35a 100644
--- a/pkg/chunk/schema.go
+++ b/pkg/chunk/schema.go
@@ -240,20 +240,11 @@ type entries interface {
 	FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery
 }
 
-// noops is a placeholder which can be embedded to provide default implementations
-type noops struct{}
-
-func (n noops) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery {
-	return queries
-}
-
 // original entries:
 // - hash key: <userid>:<bucket>:<metric name>
 // - range key: <label name>\0<label value>\0<chunk name>
 
-type originalEntries struct {
-	noops
-}
+type originalEntries struct{}
 
 func (originalEntries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	chunkIDBytes := []byte(chunkID)
@@ -322,6 +313,10 @@ func (originalEntries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]IndexQuery,
 	return nil, ErrNotSupported
 }
 
+func (originalEntries) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery {
+	return queries
+}
+
 // v3Schema went to base64 encoded label values & a version ID
 // - range key: <label name>\0<base64(label value)>\0<chunk name>\0<version 1>
 
@@ -370,9 +365,7 @@ func (base64Entries) GetReadMetricLabelValueQueries(bucket Bucket, metricName st
 //    - range key: \0<base64(label value)>\0<chunk name>\0<version 2>
 // 2) - hash key: <userid>:<hour bucket>:<metric name>
 //    - range key: \0\0<chunk name>\0<version 3>
-type labelNameInHashKeyEntries struct {
-	noops
-}
+type labelNameInHashKeyEntries struct{}
 
 func (labelNameInHashKeyEntries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	chunkIDBytes := []byte(chunkID)
@@ -443,12 +436,14 @@ func (labelNameInHashKeyEntries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]I
 	return nil, ErrNotSupported
 }
 
+func (labelNameInHashKeyEntries) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery {
+	return queries
+}
+
 // v5 schema is an extension of v4, with the chunk end time in the
 // range key to improve query latency.  However, it did it wrong
 // so the chunk end times are ignored.
-type v5Entries struct {
-	noops
-}
+type v5Entries struct{}
 
 func (v5Entries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	chunkIDBytes := []byte(chunkID)
@@ -519,11 +514,13 @@ func (v5Entries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]IndexQuery, error
 	return nil, ErrNotSupported
 }
 
+func (v5Entries) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery {
+	return queries
+}
+
 // v6Entries fixes issues with v5 time encoding being wrong (see #337), and
 // moves label value out of range key (see #199).
-type v6Entries struct {
-	noops
-}
+type v6Entries struct{}
 
 func (v6Entries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	chunkIDBytes := []byte(chunkID)
@@ -601,11 +598,13 @@ func (v6Entries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]IndexQuery, error
 	return nil, ErrNotSupported
 }
 
-// v9Entries adds a layer of indirection between labels -> series -> chunks.
-type v9Entries struct {
-	noops
+func (v6Entries) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery {
+	return queries
 }
 
+// v9Entries adds a layer of indirection between labels -> series -> chunks.
+type v9Entries struct{}
+
 func (v9Entries) GetWriteEntries(bucket Bucket, metricName string, labels labels.Labels, chunkID string) ([]IndexEntry, error) {
 	return nil, ErrNotSupported
 }
@@ -701,6 +700,10 @@ func (v9Entries) GetLabelNamesForSeries(_ Bucket, _ []byte) ([]IndexQuery, error
 	return nil, ErrNotSupported
 }
 
+func (v9Entries) FilterReadQueries(queries []IndexQuery, shard *astmapper.ShardAnnotation) []IndexQuery {
+	return queries
+}
+
 // v10Entries builds on v9 by sharding index rows to reduce their size.
 type v10Entries struct {
 	rowShards uint32

From 025f87d016ff8cb0c0282ec105f778f8372202ce Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Tue, 28 Jan 2020 10:58:09 -0500
Subject: [PATCH 09/25] NewSubtreeFolder no longer can return an error as it
 inlines the jsonCodec

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/astmapper/subtree_folder.go      | 4 ++--
 pkg/querier/astmapper/subtree_folder_test.go | 3 +--
 pkg/querier/queryrange/querysharding.go      | 5 +----
 3 files changed, 4 insertions(+), 8 deletions(-)

diff --git a/pkg/querier/astmapper/subtree_folder.go b/pkg/querier/astmapper/subtree_folder.go
index 92da5d8a502..d8be4f28564 100644
--- a/pkg/querier/astmapper/subtree_folder.go
+++ b/pkg/querier/astmapper/subtree_folder.go
@@ -14,8 +14,8 @@ type subtreeFolder struct{}
 
 // NewSubtreeFolder creates a subtreeFolder which can reduce an AST
 // to one embedded query if it contains no embedded queries yet
-func NewSubtreeFolder() (ASTMapper, error) {
-	return NewASTNodeMapper(&subtreeFolder{}), nil
+func NewSubtreeFolder() ASTMapper {
+	return NewASTNodeMapper(&subtreeFolder{})
 }
 
 // MapNode impls NodeMapper
diff --git a/pkg/querier/astmapper/subtree_folder_test.go b/pkg/querier/astmapper/subtree_folder_test.go
index f81fd1b5d2a..b30e0d83c4c 100644
--- a/pkg/querier/astmapper/subtree_folder_test.go
+++ b/pkg/querier/astmapper/subtree_folder_test.go
@@ -96,8 +96,7 @@ func TestSubtreeMapper(t *testing.T) {
 		},
 	} {
 		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
-			mapper, err := NewSubtreeFolder()
-			require.Nil(t, err)
+			mapper := NewSubtreeFolder()
 
 			expr, err := promql.ParseExpr(tc.input)
 			require.Nil(t, err)
diff --git a/pkg/querier/queryrange/querysharding.go b/pkg/querier/queryrange/querysharding.go
index daa5979c51d..eafd31e715d 100644
--- a/pkg/querier/queryrange/querysharding.go
+++ b/pkg/querier/queryrange/querysharding.go
@@ -148,10 +148,7 @@ func (ast *astMapperware) Do(ctx context.Context, r Request) (Response, error) {
 		return nil, err
 	}
 
-	subtreeFolder, err := astmapper.NewSubtreeFolder(astmapper.JSONCodec)
-	if err != nil {
-		return nil, err
-	}
+	subtreeFolder := astmapper.NewSubtreeFolder()
 
 	strQuery := r.GetQuery()
 	mappedQuery, err := mapQuery(

From 09ac71347fbe1cbffe6f8b5fff834c4e4f95d2fb Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Tue, 28 Jan 2020 15:45:13 -0500
Subject: [PATCH 10/25] account for QueryIngestersWithin renaming

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/cortex/modules.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pkg/cortex/modules.go b/pkg/cortex/modules.go
index 5cc5f065212..7ff7fd808bd 100644
--- a/pkg/cortex/modules.go
+++ b/pkg/cortex/modules.go
@@ -359,7 +359,7 @@ func (t *Cortex) initQueryFrontend(cfg *Config) (err error) {
 			MaxSamples:    cfg.Querier.MaxSamples,
 			Timeout:       cfg.Querier.Timeout,
 		},
-		cfg.Querier.IngesterMaxQueryLookback,
+		cfg.Querier.QueryIngestersWithin,
 	)
 
 	if err != nil {

From dc629c161a6d1185db29aa0ebdc0405e79bc7e41 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Fri, 31 Jan 2020 09:09:52 -0500
Subject: [PATCH 11/25] fixes rebase import collision

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/queryrange/roundtrip.go | 1 -
 1 file changed, 1 deletion(-)

diff --git a/pkg/querier/queryrange/roundtrip.go b/pkg/querier/queryrange/roundtrip.go
index eba73d8ac30..827aa1ee2dd 100644
--- a/pkg/querier/queryrange/roundtrip.go
+++ b/pkg/querier/queryrange/roundtrip.go
@@ -17,7 +17,6 @@ package queryrange
 
 import (
 	"context"
-	"errors"
 	"flag"
 	"net/http"
 	"strings"

From b9a2b6757d2a3a7e815cb6ab1880662039dc51c1 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Mon, 3 Feb 2020 08:33:35 -0500
Subject: [PATCH 12/25] fixes rebase conflicts

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/lazyquery/lazyquery.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pkg/querier/lazyquery/lazyquery.go b/pkg/querier/lazyquery/lazyquery.go
index ba8a43ceaf2..30f85de3bf2 100644
--- a/pkg/querier/lazyquery/lazyquery.go
+++ b/pkg/querier/lazyquery/lazyquery.go
@@ -45,7 +45,7 @@ func NewLazyQuerier(next storage.Querier) storage.Querier {
 }
 
 // Select impls Storage.Querier
-func (l lazyQuerier) Select(params *storage.SelectParams, matchers ...*labels.Matcher) (storage.SeriesSet, storage.Warnings, error) {
+func (l LazyQuerier) Select(params *storage.SelectParams, matchers ...*labels.Matcher) (storage.SeriesSet, storage.Warnings, error) {
 	// make sure there is space in the buffer, to unblock the goroutine and let it die even if nobody is
 	// waiting for the result yet (or anymore).
 	future := make(chan storage.SeriesSet, 1)

From 5ac63090270cd1504561f663d37175d3e92b1cc2 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Mon, 3 Feb 2020 12:46:57 -0500
Subject: [PATCH 13/25] -marks absent as non parallelizable

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/astmapper/parallel.go     | 1 +
 pkg/querier/queryrange/promql_test.go | 3 ---
 2 files changed, 1 insertion(+), 3 deletions(-)

diff --git a/pkg/querier/astmapper/parallel.go b/pkg/querier/astmapper/parallel.go
index 5b42f358bcb..e5fe6771b29 100644
--- a/pkg/querier/astmapper/parallel.go
+++ b/pkg/querier/astmapper/parallel.go
@@ -17,6 +17,7 @@ var summableAggregates = map[promql.ItemType]struct{}{
 var nonParallelFuncs = []string{
 	"histogram_quantile",
 	"quantile_over_time",
+	"absent",
 }
 
 // CanParallel tests if a subtree is parallelizable.
diff --git a/pkg/querier/queryrange/promql_test.go b/pkg/querier/queryrange/promql_test.go
index 359d3922862..c8dd34540c3 100644
--- a/pkg/querier/queryrange/promql_test.go
+++ b/pkg/querier/queryrange/promql_test.go
@@ -297,9 +297,6 @@ func Test_FunctionParallelism(t *testing.T) {
 		{
 			fn: "abs",
 		},
-		{
-			fn: "absent",
-		},
 		{
 			fn:           "avg_over_time",
 			isTestMatrix: true,

From ddd47b45b3e887377fa24f617bc3f8c12b686242 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Wed, 5 Feb 2020 10:16:57 -0500
Subject: [PATCH 14/25] upstream promql compatibility changes

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/astmapper/astmapper_test.go |  8 ++++----
 pkg/querier/astmapper/embedded.go       |  2 +-
 pkg/querier/astmapper/parallel.go       | 12 ++++++------
 pkg/querier/astmapper/parallel_test.go  | 12 ++++++------
 pkg/querier/astmapper/shard_summer.go   |  2 +-
 5 files changed, 18 insertions(+), 18 deletions(-)

diff --git a/pkg/querier/astmapper/astmapper_test.go b/pkg/querier/astmapper/astmapper_test.go
index c3f0c0b9f1f..ca90026da91 100644
--- a/pkg/querier/astmapper/astmapper_test.go
+++ b/pkg/querier/astmapper/astmapper_test.go
@@ -18,19 +18,19 @@ func TestCloneNode(t *testing.T) {
 		// simple unmodified case
 		{
 			&promql.BinaryExpr{
-				Op:  promql.ItemADD,
+				Op:  promql.ADD,
 				LHS: &promql.NumberLiteral{Val: 1},
 				RHS: &promql.NumberLiteral{Val: 1},
 			},
 			&promql.BinaryExpr{
-				Op:  promql.ItemADD,
+				Op:  promql.ADD,
 				LHS: &promql.NumberLiteral{Val: 1},
 				RHS: &promql.NumberLiteral{Val: 1},
 			},
 		},
 		{
 			&promql.AggregateExpr{
-				Op:      promql.ItemSum,
+				Op:      promql.SUM,
 				Without: true,
 				Expr: &promql.VectorSelector{
 					Name: "some_metric",
@@ -41,7 +41,7 @@ func TestCloneNode(t *testing.T) {
 				Grouping: []string{"foo"},
 			},
 			&promql.AggregateExpr{
-				Op:      promql.ItemSum,
+				Op:      promql.SUM,
 				Without: true,
 				Expr: &promql.VectorSelector{
 					Name: "some_metric",
diff --git a/pkg/querier/astmapper/embedded.go b/pkg/querier/astmapper/embedded.go
index de2f2f518e4..2bf9afe4497 100644
--- a/pkg/querier/astmapper/embedded.go
+++ b/pkg/querier/astmapper/embedded.go
@@ -89,7 +89,7 @@ func OrSquasher(nodes ...promql.Node) (promql.Expr, error) {
 	combined := nodes[0]
 	for i := 1; i < len(nodes); i++ {
 		combined = &promql.BinaryExpr{
-			Op:  promql.ItemLOR,
+			Op:  promql.LOR,
 			LHS: combined.(promql.Expr),
 			RHS: nodes[i].(promql.Expr),
 		}
diff --git a/pkg/querier/astmapper/parallel.go b/pkg/querier/astmapper/parallel.go
index e5fe6771b29..27d8d532a5a 100644
--- a/pkg/querier/astmapper/parallel.go
+++ b/pkg/querier/astmapper/parallel.go
@@ -6,12 +6,12 @@ import (
 )
 
 var summableAggregates = map[promql.ItemType]struct{}{
-	promql.ItemSum:     {},
-	promql.ItemMin:     {},
-	promql.ItemMax:     {},
-	promql.ItemTopK:    {},
-	promql.ItemBottomK: {},
-	promql.ItemCount:   {},
+	promql.SUM:     {},
+	promql.MIN:     {},
+	promql.MAX:     {},
+	promql.TOPK:    {},
+	promql.BOTTOMK: {},
+	promql.COUNT:   {},
 }
 
 var nonParallelFuncs = []string{
diff --git a/pkg/querier/astmapper/parallel_test.go b/pkg/querier/astmapper/parallel_test.go
index 6032137f57b..890b9c34690 100644
--- a/pkg/querier/astmapper/parallel_test.go
+++ b/pkg/querier/astmapper/parallel_test.go
@@ -18,7 +18,7 @@ func TestCanParallel(t *testing.T) {
 		// simple sum
 		{
 			&promql.AggregateExpr{
-				Op:      promql.ItemSum,
+				Op:      promql.SUM,
 				Without: true,
 				Expr: &promql.VectorSelector{
 					Name: "some_metric",
@@ -39,11 +39,11 @@ func TestCanParallel(t *testing.T) {
 		*/
 		{
 			&promql.AggregateExpr{
-				Op: promql.ItemSum,
+				Op: promql.SUM,
 				Expr: &promql.BinaryExpr{
-					Op: promql.ItemDIV,
+					Op: promql.DIV,
 					LHS: &promql.AggregateExpr{
-						Op:       promql.ItemSum,
+						Op:       promql.SUM,
 						Grouping: []string{"foo"},
 						Expr: &promql.VectorSelector{
 							Name: "idk",
@@ -52,7 +52,7 @@ func TestCanParallel(t *testing.T) {
 							}},
 					},
 					RHS: &promql.AggregateExpr{
-						Op:       promql.ItemSum,
+						Op:       promql.SUM,
 						Grouping: []string{"foo"},
 						Expr: &promql.VectorSelector{
 							Name: "idk",
@@ -67,7 +67,7 @@ func TestCanParallel(t *testing.T) {
 		// sum by (foo) bar1{baz=”blip”}[1m]) ---- this is the first leg of the above
 		{
 			&promql.AggregateExpr{
-				Op:       promql.ItemSum,
+				Op:       promql.SUM,
 				Grouping: []string{"foo"},
 				Expr: &promql.VectorSelector{
 					Name: "idk",
diff --git a/pkg/querier/astmapper/shard_summer.go b/pkg/querier/astmapper/shard_summer.go
index 1a6b7d331f6..533fc13eb20 100644
--- a/pkg/querier/astmapper/shard_summer.go
+++ b/pkg/querier/astmapper/shard_summer.go
@@ -59,7 +59,7 @@ func (summer *shardSummer) MapNode(node promql.Node) (promql.Node, bool, error)
 
 	switch n := node.(type) {
 	case *promql.AggregateExpr:
-		if CanParallel(n) && n.Op == promql.ItemSum {
+		if CanParallel(n) && n.Op == promql.SUM {
 			result, err := summer.shardSum(n)
 			return result, true, err
 		}

From 07e894c4876aaef2f80849dcf422003901417ddd Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Mon, 10 Feb 2020 17:08:03 -0500
Subject: [PATCH 15/25] addresses pr comments

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/chunk/schema.go                        | 14 +++++++++++++-
 pkg/ingester/ingester.go                   |  1 -
 pkg/querier/astmapper/embedded.go          | 13 -------------
 pkg/querier/astmapper/shard_summer_test.go | 16 +++++++++++++++-
 4 files changed, 28 insertions(+), 16 deletions(-)

diff --git a/pkg/chunk/schema.go b/pkg/chunk/schema.go
index a9014efb35a..53e930e4086 100644
--- a/pkg/chunk/schema.go
+++ b/pkg/chunk/schema.go
@@ -9,9 +9,11 @@ import (
 
 	"strconv"
 
+	"github.com/go-kit/kit/log/level"
 	jsoniter "github.com/json-iterator/go"
 
 	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
 )
@@ -822,6 +824,17 @@ func (v10Entries) FilterReadQueries(queries []IndexQuery, shard *astmapper.Shard
 	for _, query := range queries {
 		s := strings.Split(query.HashValue, ":")[0]
 		n, err := strconv.Atoi(s)
+		if err != nil {
+			level.Error(util.Logger).Log(
+				"msg",
+				"Unable to determine shard from IndexQuery",
+				"HashValue",
+				query.HashValue,
+				"schema",
+				"v10",
+			)
+		}
+
 		if err == nil && n == shard.Shard {
 			matches = append(matches, query)
 		}
@@ -892,5 +905,4 @@ func (v11Entries) GetLabelNamesForSeries(bucket Bucket, seriesID []byte) ([]Inde
 			HashValue: string(seriesID),
 		},
 	}, nil
-
 }
diff --git a/pkg/ingester/ingester.go b/pkg/ingester/ingester.go
index 27eac4652d3..dcd52a9baec 100644
--- a/pkg/ingester/ingester.go
+++ b/pkg/ingester/ingester.go
@@ -518,7 +518,6 @@ func (i *Ingester) QueryStream(req *client.QueryRequest, stream client.Ingester_
 		}
 
 		numChunks += len(wireChunks)
-
 		batch = append(batch, client.TimeSeriesChunk{
 			Labels: client.FromLabelsToLabelAdapters(series.metric),
 			Chunks: wireChunks,
diff --git a/pkg/querier/astmapper/embedded.go b/pkg/querier/astmapper/embedded.go
index 2bf9afe4497..6c50564ab47 100644
--- a/pkg/querier/astmapper/embedded.go
+++ b/pkg/querier/astmapper/embedded.go
@@ -83,16 +83,3 @@ func VectorSquasher(nodes ...promql.Node) (promql.Expr, error) {
 	}, nil
 
 }
-
-// OrSquasher is a custom squasher which mimics the intuitive but less efficient OR'ing of sharded vectors.
-func OrSquasher(nodes ...promql.Node) (promql.Expr, error) {
-	combined := nodes[0]
-	for i := 1; i < len(nodes); i++ {
-		combined = &promql.BinaryExpr{
-			Op:  promql.LOR,
-			LHS: combined.(promql.Expr),
-			RHS: nodes[i].(promql.Expr),
-		}
-	}
-	return combined.(promql.Expr), nil
-}
diff --git a/pkg/querier/astmapper/shard_summer_test.go b/pkg/querier/astmapper/shard_summer_test.go
index 9182e2d87ac..a76fcb79560 100644
--- a/pkg/querier/astmapper/shard_summer_test.go
+++ b/pkg/querier/astmapper/shard_summer_test.go
@@ -9,6 +9,20 @@ import (
 	"github.com/stretchr/testify/require"
 )
 
+// orSquasher is a test-only squasher that left-folds the sharded nodes into a chain of OR binary expressions (intuitive, but less efficient).
+// Its output is human readable, which helps in tests. It panics if nodes is empty or if any node is not a promql.Expr.
+func orSquasher(nodes ...promql.Node) (promql.Expr, error) {
+	combined := nodes[0]
+	for i := 1; i < len(nodes); i++ {
+		combined = &promql.BinaryExpr{
+			Op:  promql.LOR,
+			LHS: combined.(promql.Expr),
+			RHS: nodes[i].(promql.Expr),
+		}
+	}
+	return combined.(promql.Expr), nil
+}
+
 func TestShardSummer(t *testing.T) {
 	var testExpr = []struct {
 		shards   int
@@ -106,7 +120,7 @@ func TestShardSummer(t *testing.T) {
 	for i, c := range testExpr {
 		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
 
-			summer, err := NewShardSummer(c.shards, OrSquasher)
+			summer, err := NewShardSummer(c.shards, orSquasher)
 			require.Nil(t, err)
 			expr, err := promql.ParseExpr(c.input)
 			require.Nil(t, err)

From 4c6f40bcafc5ffe1264a96718cf87d595f50b5e6 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Mon, 10 Feb 2020 17:33:44 -0500
Subject: [PATCH 16/25] import collisions

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/chunk_tar_test.go            | 5 +----
 pkg/querier/lazyquery/lazyquery.go       | 3 +--
 pkg/querier/queryrange/roundtrip_test.go | 3 +--
 pkg/querier/remote_read_test.go          | 3 +--
 4 files changed, 4 insertions(+), 10 deletions(-)

diff --git a/pkg/querier/chunk_tar_test.go b/pkg/querier/chunk_tar_test.go
index 275cb1e36a2..bfc2a974af7 100644
--- a/pkg/querier/chunk_tar_test.go
+++ b/pkg/querier/chunk_tar_test.go
@@ -11,10 +11,6 @@ import (
 	"testing"
 	"time"
 
-	"github.com/cortexproject/cortex/pkg/chunk"
-	"github.com/cortexproject/cortex/pkg/querier/batch"
-	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
-	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/stretchr/testify/require"
@@ -22,6 +18,7 @@ import (
 
 	"github.com/cortexproject/cortex/pkg/chunk"
 	"github.com/cortexproject/cortex/pkg/querier/batch"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 	"github.com/cortexproject/cortex/pkg/util"
 )
 
diff --git a/pkg/querier/lazyquery/lazyquery.go b/pkg/querier/lazyquery/lazyquery.go
index 30f85de3bf2..1a19d65e1df 100644
--- a/pkg/querier/lazyquery/lazyquery.go
+++ b/pkg/querier/lazyquery/lazyquery.go
@@ -4,13 +4,12 @@ import (
 	"context"
 	"fmt"
 
-	"github.com/cortexproject/cortex/pkg/chunk"
-	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/storage"
 
 	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 )
 
 // LazyQueryable wraps a storage.Queryable
diff --git a/pkg/querier/queryrange/roundtrip_test.go b/pkg/querier/queryrange/roundtrip_test.go
index 65e04e1e5c7..082cfdb3572 100644
--- a/pkg/querier/queryrange/roundtrip_test.go
+++ b/pkg/querier/queryrange/roundtrip_test.go
@@ -10,14 +10,13 @@ import (
 	"testing"
 	"time"
 
-	"github.com/cortexproject/cortex/pkg/chunk"
-	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/go-kit/kit/log"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/stretchr/testify/require"
 	"github.com/weaveworks/common/middleware"
 	"github.com/weaveworks/common/user"
 
+	"github.com/cortexproject/cortex/pkg/chunk"
 	"github.com/cortexproject/cortex/pkg/util"
 )
 
diff --git a/pkg/querier/remote_read_test.go b/pkg/querier/remote_read_test.go
index 9f4fea14439..f12c2460d89 100644
--- a/pkg/querier/remote_read_test.go
+++ b/pkg/querier/remote_read_test.go
@@ -9,8 +9,6 @@ import (
 	"net/http/httptest"
 	"testing"
 
-	"github.com/cortexproject/cortex/pkg/ingester/client"
-	"github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/gogo/protobuf/proto"
 	"github.com/golang/snappy"
 	"github.com/prometheus/common/model"
@@ -19,6 +17,7 @@ import (
 	"github.com/stretchr/testify/require"
 
 	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/cortexproject/cortex/pkg/querier/series"
 )
 
 func TestRemoteReadHandler(t *testing.T) {

From 42851ff9ac1f007c818dc9e6601b4fcb4f927874 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Mon, 10 Feb 2020 18:24:18 -0500
Subject: [PATCH 17/25] linting - fixes goimports -local requirement

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/chunk/chunk.go                           | 3 +--
 pkg/chunk/schema.go                          | 4 ++--
 pkg/chunk/schema_test.go                     | 3 ++-
 pkg/querier/chunkstore/chunkstore.go         | 3 ++-
 pkg/querier/queryrange/promql_test.go        | 5 +++--
 pkg/querier/queryrange/queryable.go          | 3 ++-
 pkg/querier/queryrange/queryable_test.go     | 5 +++--
 pkg/querier/queryrange/querysharding.go      | 7 ++++---
 pkg/querier/queryrange/querysharding_test.go | 7 ++++---
 pkg/querier/queryrange/series_test.go        | 3 ++-
 pkg/querier/queryrange/test_utils.go         | 5 +++--
 pkg/querier/queryrange/test_utils_test.go    | 3 ++-
 pkg/querier/queryrange/value.go              | 5 +++--
 pkg/querier/queryrange/value_test.go         | 3 ++-
 14 files changed, 35 insertions(+), 24 deletions(-)

diff --git a/pkg/chunk/chunk.go b/pkg/chunk/chunk.go
index 295da5d84ec..417b60a6ada 100644
--- a/pkg/chunk/chunk.go
+++ b/pkg/chunk/chunk.go
@@ -14,11 +14,10 @@ import (
 	"github.com/pkg/errors"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
+	errs "github.com/weaveworks/common/errors"
 
 	prom_chunk "github.com/cortexproject/cortex/pkg/chunk/encoding"
 	"github.com/cortexproject/cortex/pkg/prom1/storage/metric"
-
-	errs "github.com/weaveworks/common/errors"
 )
 
 // Errors that decode can return
diff --git a/pkg/chunk/schema.go b/pkg/chunk/schema.go
index 53e930e4086..26f25d1f649 100644
--- a/pkg/chunk/schema.go
+++ b/pkg/chunk/schema.go
@@ -11,11 +11,11 @@ import (
 
 	"github.com/go-kit/kit/log/level"
 	jsoniter "github.com/json-iterator/go"
+	"github.com/prometheus/common/model"
+	"github.com/prometheus/prometheus/pkg/labels"
 
 	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	"github.com/cortexproject/cortex/pkg/util"
-	"github.com/prometheus/common/model"
-	"github.com/prometheus/prometheus/pkg/labels"
 )
 
 const (
diff --git a/pkg/chunk/schema_test.go b/pkg/chunk/schema_test.go
index c697e321677..0393b118ee5 100644
--- a/pkg/chunk/schema_test.go
+++ b/pkg/chunk/schema_test.go
@@ -8,13 +8,14 @@ import (
 	"sort"
 	"testing"
 
-	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	jsoniter "github.com/json-iterator/go"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/stretchr/testify/require"
 	"github.com/weaveworks/common/test"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 )
 
 type ByHashRangeKey []IndexEntry
diff --git a/pkg/querier/chunkstore/chunkstore.go b/pkg/querier/chunkstore/chunkstore.go
index 3b1045ef0d6..754ae0a9544 100644
--- a/pkg/querier/chunkstore/chunkstore.go
+++ b/pkg/querier/chunkstore/chunkstore.go
@@ -3,9 +3,10 @@ package chunkstore
 import (
 	"context"
 
-	"github.com/cortexproject/cortex/pkg/chunk"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
+
+	"github.com/cortexproject/cortex/pkg/chunk"
 )
 
 // ChunkStore is the read-interface to the Chunk Store.  Made an interface here
diff --git a/pkg/querier/queryrange/promql_test.go b/pkg/querier/queryrange/promql_test.go
index c8dd34540c3..ded2cc12416 100644
--- a/pkg/querier/queryrange/promql_test.go
+++ b/pkg/querier/queryrange/promql_test.go
@@ -9,13 +9,14 @@ import (
 	"testing"
 	"time"
 
-	"github.com/cortexproject/cortex/pkg/querier/astmapper"
-	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/prometheus/client_golang/prometheus"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/prometheus/prometheus/storage"
 	"github.com/stretchr/testify/require"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/cortexproject/cortex/pkg/util"
 )
 
 var (
diff --git a/pkg/querier/queryrange/queryable.go b/pkg/querier/queryrange/queryable.go
index 14a2ed7b073..2c5d6db02f0 100644
--- a/pkg/querier/queryrange/queryable.go
+++ b/pkg/querier/queryrange/queryable.go
@@ -3,10 +3,11 @@ package queryrange
 import (
 	"context"
 
-	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/storage"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 )
 
 const (
diff --git a/pkg/querier/queryrange/queryable_test.go b/pkg/querier/queryrange/queryable_test.go
index d056bc37dca..5b42ec9fbf6 100644
--- a/pkg/querier/queryrange/queryable_test.go
+++ b/pkg/querier/queryrange/queryable_test.go
@@ -4,12 +4,13 @@ import (
 	"context"
 	"testing"
 
-	"github.com/cortexproject/cortex/pkg/ingester/client"
-	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/stretchr/testify/require"
+
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 )
 
 func TestSelect(t *testing.T) {
diff --git a/pkg/querier/queryrange/querysharding.go b/pkg/querier/queryrange/querysharding.go
index eafd31e715d..9ad17989a95 100644
--- a/pkg/querier/queryrange/querysharding.go
+++ b/pkg/querier/queryrange/querysharding.go
@@ -5,13 +5,14 @@ import (
 	fmt "fmt"
 	"time"
 
-	"github.com/cortexproject/cortex/pkg/chunk"
-	"github.com/cortexproject/cortex/pkg/querier/astmapper"
-	"github.com/cortexproject/cortex/pkg/querier/lazyquery"
 	"github.com/go-kit/kit/log"
 	"github.com/go-kit/kit/log/level"
 	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/promql"
+
+	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/cortexproject/cortex/pkg/querier/lazyquery"
 )
 
 var (
diff --git a/pkg/querier/queryrange/querysharding_test.go b/pkg/querier/queryrange/querysharding_test.go
index 4094a457432..d57c7b0e969 100644
--- a/pkg/querier/queryrange/querysharding_test.go
+++ b/pkg/querier/queryrange/querysharding_test.go
@@ -8,15 +8,16 @@ import (
 	"testing"
 	"time"
 
-	"github.com/cortexproject/cortex/pkg/chunk"
-	"github.com/cortexproject/cortex/pkg/ingester/client"
-	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/go-kit/kit/log"
 	"github.com/pkg/errors"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/prometheus/prometheus/storage"
 	"github.com/stretchr/testify/require"
+
+	"github.com/cortexproject/cortex/pkg/chunk"
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/cortexproject/cortex/pkg/util"
 )
 
 func TestQueryshardingMiddleware(t *testing.T) {
diff --git a/pkg/querier/queryrange/series_test.go b/pkg/querier/queryrange/series_test.go
index 262503e8538..1523db47883 100644
--- a/pkg/querier/queryrange/series_test.go
+++ b/pkg/querier/queryrange/series_test.go
@@ -3,9 +3,10 @@ package queryrange
 import (
 	"testing"
 
-	"github.com/cortexproject/cortex/pkg/ingester/client"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/stretchr/testify/require"
+
+	"github.com/cortexproject/cortex/pkg/ingester/client"
 )
 
 func Test_ResponseToSamples(t *testing.T) {
diff --git a/pkg/querier/queryrange/test_utils.go b/pkg/querier/queryrange/test_utils.go
index 0eb68a394b3..400b0eef71a 100644
--- a/pkg/querier/queryrange/test_utils.go
+++ b/pkg/querier/queryrange/test_utils.go
@@ -5,12 +5,13 @@ import (
 	"fmt"
 	"time"
 
-	"github.com/cortexproject/cortex/pkg/querier/astmapper"
-	"github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/pkg/errors"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/storage"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
+	"github.com/cortexproject/cortex/pkg/querier/series"
 )
 
 // genLabels will create a slice of labels where each label has an equal chance to occupy a value from [0,labelBuckets]. It returns a slice of length labelBuckets^len(labelSet)
diff --git a/pkg/querier/queryrange/test_utils_test.go b/pkg/querier/queryrange/test_utils_test.go
index 8e5f187b927..3deda66e400 100644
--- a/pkg/querier/queryrange/test_utils_test.go
+++ b/pkg/querier/queryrange/test_utils_test.go
@@ -5,9 +5,10 @@ import (
 	"sort"
 	"testing"
 
-	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/stretchr/testify/require"
+
+	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 )
 
 func TestGenLabelsCorrectness(t *testing.T) {
diff --git a/pkg/querier/queryrange/value.go b/pkg/querier/queryrange/value.go
index c5804637017..ce3c0edcbe6 100644
--- a/pkg/querier/queryrange/value.go
+++ b/pkg/querier/queryrange/value.go
@@ -1,13 +1,14 @@
 package queryrange
 
 import (
-	"github.com/cortexproject/cortex/pkg/ingester/client"
-	"github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/pkg/errors"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/prometheus/prometheus/storage"
+
+	"github.com/cortexproject/cortex/pkg/ingester/client"
+	"github.com/cortexproject/cortex/pkg/querier/series"
 )
 
 // FromResult transforms a promql query result into a samplestream
diff --git a/pkg/querier/queryrange/value_test.go b/pkg/querier/queryrange/value_test.go
index 524c2e83d90..00bfb7447c5 100644
--- a/pkg/querier/queryrange/value_test.go
+++ b/pkg/querier/queryrange/value_test.go
@@ -4,11 +4,12 @@ import (
 	"fmt"
 	"testing"
 
-	"github.com/cortexproject/cortex/pkg/ingester/client"
 	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/pkg/labels"
 	"github.com/prometheus/prometheus/promql"
 	"github.com/stretchr/testify/require"
+
+	"github.com/cortexproject/cortex/pkg/ingester/client"
 )
 
 func TestFromValue(t *testing.T) {

From 7347d45d6a0ef12e7c3515ede208637dd53a5922 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Wed, 19 Feb 2020 17:39:18 -0500
Subject: [PATCH 18/25] fixes merge conflicts

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/block.go                 | 5 +++--
 pkg/querier/distributor_queryable.go | 4 ++--
 pkg/querier/lazyquery/lazyquery.go   | 4 ++++
 pkg/querier/querier.go               | 5 +++--
 4 files changed, 12 insertions(+), 6 deletions(-)

diff --git a/pkg/querier/block.go b/pkg/querier/block.go
index acdf5a7d0c2..7a56813ea95 100644
--- a/pkg/querier/block.go
+++ b/pkg/querier/block.go
@@ -18,6 +18,7 @@ import (
 	"github.com/weaveworks/common/user"
 	"google.golang.org/grpc/metadata"
 
+	"github.com/cortexproject/cortex/pkg/querier/series"
 	"github.com/cortexproject/cortex/pkg/storage/tsdb"
 	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/cortexproject/cortex/pkg/util/spanlogger"
@@ -244,7 +245,7 @@ func (bqs *blockQuerierSeries) Labels() labels.Labels {
 func (bqs *blockQuerierSeries) Iterator() storage.SeriesIterator {
 	if len(bqs.chunks) == 0 {
 		// should not happen in practice, but we have a unit test for it
-		return errIterator{err: errors.New("no chunks")}
+		return series.NewErrIterator(errors.New("no chunks"))
 	}
 
 	its := make([]chunkenc.Iterator, 0, len(bqs.chunks))
@@ -252,7 +253,7 @@ func (bqs *blockQuerierSeries) Iterator() storage.SeriesIterator {
 	for _, c := range bqs.chunks {
 		ch, err := chunkenc.FromData(chunkenc.EncXOR, c.Raw.Data)
 		if err != nil {
-			return errIterator{err: errors.Wrapf(err, "failed to initialize chunk from XOR encoded raw data (series: %v min time: %d max time: %d)", bqs.Labels(), c.MinTime, c.MaxTime)}
+			return series.NewErrIterator(errors.Wrapf(err, "failed to initialize chunk from XOR encoded raw data (series: %v min time: %d max time: %d)", bqs.Labels(), c.MinTime, c.MaxTime))
 		}
 
 		it := ch.Iterator(nil)
diff --git a/pkg/querier/distributor_queryable.go b/pkg/querier/distributor_queryable.go
index 6cffd9fe7c5..25961025912 100644
--- a/pkg/querier/distributor_queryable.go
+++ b/pkg/querier/distributor_queryable.go
@@ -55,7 +55,7 @@ func (q *distributorQuerier) Select(sp *storage.SelectParams, matchers ...*label
 		if err != nil {
 			return nil, nil, err
 		}
-		return metricsToSeriesSet(ms), nil, nil
+		return series.MetricsToSeriesSet(ms), nil, nil
 	}
 
 	mint, maxt := sp.Start, sp.End
@@ -108,7 +108,7 @@ func (q *distributorQuerier) streamingSelect(sp storage.SelectParams, matchers [
 		serieses = append(serieses, series)
 	}
 
-	return newConcreteSeriesSet(serieses), nil, nil
+	return series.NewConcreteSeriesSet(serieses), nil, nil
 }
 
 func (q *distributorQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
diff --git a/pkg/querier/lazyquery/lazyquery.go b/pkg/querier/lazyquery/lazyquery.go
index 1a19d65e1df..ba6531f74f0 100644
--- a/pkg/querier/lazyquery/lazyquery.go
+++ b/pkg/querier/lazyquery/lazyquery.go
@@ -86,6 +86,10 @@ func (l LazyQuerier) Get(ctx context.Context, userID string, from, through model
 	return store.Get(ctx, userID, from, through, matchers...)
 }
 
+func NewErrSeriesSet(err error) storage.SeriesSet {
+	return errSeriesSet{err}
+}
+
 // errSeriesSet implements storage.SeriesSet, just returning an error.
 type errSeriesSet struct {
 	err error
diff --git a/pkg/querier/querier.go b/pkg/querier/querier.go
index 6a1e8bdcc5f..63120f442ea 100644
--- a/pkg/querier/querier.go
+++ b/pkg/querier/querier.go
@@ -14,6 +14,7 @@ import (
 
 	"github.com/cortexproject/cortex/pkg/chunk"
 	"github.com/cortexproject/cortex/pkg/querier/batch"
+	"github.com/cortexproject/cortex/pkg/querier/chunkstore"
 	"github.com/cortexproject/cortex/pkg/querier/iterators"
 	"github.com/cortexproject/cortex/pkg/querier/lazyquery"
 	"github.com/cortexproject/cortex/pkg/util"
@@ -84,7 +85,7 @@ func getChunksIteratorFunction(cfg Config) chunkIteratorFunc {
 	return mergeChunks
 }
 
-func NewChunkStoreQueryable(cfg Config, chunkStore ChunkStore) storage.Queryable {
+func NewChunkStoreQueryable(cfg Config, chunkStore chunkstore.ChunkStore) storage.Queryable {
 	return newChunkStoreQueryable(chunkStore, getChunksIteratorFunction(cfg))
 }
 
@@ -234,7 +235,7 @@ func (q querier) mergeSeriesSets(sets []storage.SeriesSet) storage.SeriesSet {
 			// If there is error, we better report it.
 			err := set.Err()
 			if err != nil {
-				otherSets = append(otherSets, errSeriesSet{err: err})
+				otherSets = append(otherSets, lazyquery.NewErrSeriesSet(err))
 			}
 			continue
 		}

From 10dd5972bfacf9ea354280b4dbb75a7802f5b0c3 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Wed, 19 Feb 2020 19:02:46 -0500
Subject: [PATCH 19/25] addresses pr comments

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 CHANGELOG.md                              | 21 +++++++++---------
 docs/configuration/arguments.md           |  4 +++-
 pkg/chunk/chunk_store_utils.go            |  8 -------
 pkg/chunk/schema_config.go                |  8 -------
 pkg/chunk/series_store.go                 | 11 ++++++++++
 pkg/querier/astmapper/embedded.go         | 20 ++++++++---------
 pkg/querier/astmapper/parallel.go         |  8 +++++--
 pkg/querier/astmapper/subtree_folder.go   |  4 ++--
 pkg/querier/queryrange/instrumentation.go |  2 +-
 pkg/querier/queryrange/queryable.go       |  2 +-
 pkg/querier/queryrange/queryable_test.go  | 26 +++++++++++++++--------
 pkg/querier/queryrange/querysharding.go   |  6 ++----
 pkg/querier/queryrange/roundtrip.go       | 14 +++++++-----
 pkg/querier/queryrange/roundtrip_test.go  |  2 +-
 14 files changed, 72 insertions(+), 64 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index eb23843f300..09cdf7eb584 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -2,6 +2,16 @@
 
 ## master / unreleased
 
+* [FEATURE] Fan out parallelizable queries to backend queriers concurrently. #1878
+  * `-querier.sum-shards` (bool)
+  * Requires a shard-compatible schema (v10+)
+  * This causes the number of traces to increase accordingly.
+  * The query-frontend now requires a schema config to determine how/when to shard queries, either from a file or from flags (i.e. by the `config-yaml` CLI flag). This is the same schema config the queriers consume. The schema config is only required when this option is enabled.
+  * It's also advised to increase downstream concurrency controls:
+    * `querier.max-outstanding-requests-per-tenant`
+    * `querier.max-query-parallelism`
+    * `querier.max-concurrent`
+    * `server.grpc-max-concurrent-streams` (for both query-frontends and queriers)
 * [CHANGE] The frontend http server will now send 502 in case of deadline exceeded and 499 if the user requested cancellation. #2156
 * [CHANGE] Config file changed to remove top level `config_store` field in favor of a nested `configdb` field. #2125
 * [CHANGE] Removed unnecessary `frontend.cache-split-interval` in favor of `querier.split-queries-by-interval` both to reduce configuration complexity and guarantee alignment of these two configs. Starting from now, `-querier.cache-results` may only be enabled in conjunction with `-querier.split-queries-by-interval` (previously the cache interval default was `24h` so if you want to preserve the same behaviour you should set `-querier.split-queries-by-interval=24h`). #2040
@@ -62,17 +72,6 @@ Note that the ruler flags need to be changed in this upgrade. You're moving from
 Further, if you're using the configs service, we've upgraded the migration library and this requires some manual intervention. See full instructions below to upgrade your PostgreSQL.
 
 * [CHANGE] The frontend component now does not cache results if it finds a `Cache-Control` header and if one of its values is `no-store`. #1974
-* [FEATURE] Fan out parallelizable queries to backend queriers concurrently.
-  * `-querier.sum-shards` (bool)
-  * Requires a shard-compatible schema (v10+)
-  * This causes the number of traces to increase accordingly.
-  * The query-frontend now requires a schema config to determine how/when to shard queries, either from a file or from flags (i.e. by the `config-yaml` CLI flag). This is the same schema config the queriers consume.
-  * It's also advised to increase downstream concurrency controls as well:
-    * `querier.max-outstanding-requests-per-tenant`
-    * `querier.max-query-parallelism`
-    * `querier.max-concurrent`
-    * `server.grpc-max-concurrent-streams` (for both query-frontends and queriers)
-* [ENHANCEMENT] metric `cortex_ingester_flush_reasons` gets a new `reason` value: `Spread`, when `-ingester.spread-flushes` option is enabled.
 * [CHANGE] Flags changed with transition to upstream Prometheus rules manager:
   * `-ruler.client-timeout` is now `ruler.configs.client-timeout` in order to match `ruler.configs.url`.
   * `-ruler.group-timeout`has been removed.
diff --git a/docs/configuration/arguments.md b/docs/configuration/arguments.md
index 3508f838ce4..266c1b28059 100644
--- a/docs/configuration/arguments.md
+++ b/docs/configuration/arguments.md
@@ -86,9 +86,11 @@ The ingester query API was improved over time, but defaults to the old behaviour
    - `querier.max-outstanding-requests-per-tenant`
    - `querier.max-query-parallelism`
    - `querier.max-concurrent`
+   - `server.grpc-max-concurrent-streams` (for both query-frontends and queriers)
+
    Furthermore, both querier and query-frontend components require the `querier.query-ingesters-within` parameter to know when to start sharding requests (ingester queries are not sharded). It's recommended to align this with `ingester.max-chunk-age`.
 
-   Instrumentation (traces) also scale with the number of sharded queries and it's suggested to account for increased throughput there as well.
+   Instrumentation (traces) also scales with the number of sharded queries, so it's suggested to account for the increased throughput there as well (for instance via `JAEGER_REPORTER_MAX_QUEUE_SIZE`).
 
 - `-querier.align-querier-with-step`
 
diff --git a/pkg/chunk/chunk_store_utils.go b/pkg/chunk/chunk_store_utils.go
index 948ee40e181..27a5a84fe97 100644
--- a/pkg/chunk/chunk_store_utils.go
+++ b/pkg/chunk/chunk_store_utils.go
@@ -10,7 +10,6 @@ import (
 	"github.com/prometheus/prometheus/promql"
 
 	"github.com/cortexproject/cortex/pkg/chunk/cache"
-	"github.com/cortexproject/cortex/pkg/querier/astmapper"
 	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/cortexproject/cortex/pkg/util/spanlogger"
 )
@@ -256,10 +255,3 @@ func (c *Fetcher) processCacheResponse(ctx context.Context, chunks []Chunk, keys
 	}
 	return found, missing, err
 }
-
-func injectShardLabels(chunks []Chunk, shard astmapper.ShardAnnotation) {
-	for i, chunk := range chunks {
-		chunk.Metric = append(chunk.Metric, shard.Label())
-		chunks[i] = chunk
-	}
-}
diff --git a/pkg/chunk/schema_config.go b/pkg/chunk/schema_config.go
index b03de6f6c6e..4d794f7a8ed 100644
--- a/pkg/chunk/schema_config.go
+++ b/pkg/chunk/schema_config.go
@@ -317,14 +317,6 @@ func (cfg *SchemaConfig) Load() error {
 		return err
 	}
 
-	for i, periodCfg := range cfg.Configs {
-		// apply default row shards
-		if periodCfg.RowShards == 0 {
-			periodCfg.RowShards = defaultRowShards(periodCfg.Schema)
-			cfg.Configs[i] = periodCfg
-		}
-	}
-
 	return cfg.Validate()
 }
 
diff --git a/pkg/chunk/series_store.go b/pkg/chunk/series_store.go
index 13021d78daf..a41f8ea4047 100644
--- a/pkg/chunk/series_store.go
+++ b/pkg/chunk/series_store.go
@@ -534,3 +534,14 @@ func (c *seriesStore) calculateIndexEntries(ctx context.Context, from, through m
 
 	return result, missing, nil
 }
+
+func injectShardLabels(chunks []Chunk, shard astmapper.ShardAnnotation) {
+	for i, chunk := range chunks {
+		// chunk is a copy of the slice element: set the shard label by name via labels.Builder, then write the result back to chunks[i].
+		b := labels.NewBuilder(chunk.Metric)
+		l := shard.Label()
+		b.Set(l.Name, l.Value)
+		chunk.Metric = b.Labels()
+		chunks[i] = chunk
+	}
+}
diff --git a/pkg/querier/astmapper/embedded.go b/pkg/querier/astmapper/embedded.go
index 6c50564ab47..645e4fc3866 100644
--- a/pkg/querier/astmapper/embedded.go
+++ b/pkg/querier/astmapper/embedded.go
@@ -21,8 +21,8 @@ be remapped into vector or matrix selectors utilizing a reserved label containin
 const (
 	// QueryLabel is a reserved label containing an embedded query
 	QueryLabel = "__cortex_queries__"
-	// EmbeddedQueryFlag is a reserved label (metric name) denoting an embedded query
-	EmbeddedQueryFlag = "__embedded_queries__"
+	// EmbeddedQueriesMetricName is a reserved label (metric name) denoting an embedded query
+	EmbeddedQueriesMetricName = "__embedded_queries__"
 )
 
 // EmbeddedQueries is a wrapper type for encoding queries
@@ -35,17 +35,12 @@ var JSONCodec jsonCodec
 
 type jsonCodec struct{}
 
-func (c jsonCodec) Encode(queries []string) string {
+func (c jsonCodec) Encode(queries []string) (string, error) {
 	embedded := EmbeddedQueries{
 		Concat: queries,
 	}
 	b, err := json.Marshal(embedded)
-
-	if err != nil {
-		panic(err)
-	}
-
-	return string(b)
+	return string(b), err
 }
 
 func (c jsonCodec) Decode(encoded string) (queries []string, err error) {
@@ -69,7 +64,10 @@ func VectorSquasher(nodes ...promql.Node) (promql.Expr, error) {
 		strs = append(strs, node.String())
 	}
 
-	encoded := JSONCodec.Encode(strs)
+	encoded, err := JSONCodec.Encode(strs)
+	if err != nil {
+		return nil, err
+	}
 
 	embeddedQuery, err := labels.NewMatcher(labels.MatchEqual, QueryLabel, encoded)
 
@@ -78,7 +76,7 @@ func VectorSquasher(nodes ...promql.Node) (promql.Expr, error) {
 	}
 
 	return &promql.VectorSelector{
-		Name:          EmbeddedQueryFlag,
+		Name:          EmbeddedQueriesMetricName,
 		LabelMatchers: []*labels.Matcher{embeddedQuery},
 	}, nil
 
diff --git a/pkg/querier/astmapper/parallel.go b/pkg/querier/astmapper/parallel.go
index 27d8d532a5a..1ee6fef0ed5 100644
--- a/pkg/querier/astmapper/parallel.go
+++ b/pkg/querier/astmapper/parallel.go
@@ -1,7 +1,10 @@
 package astmapper
 
 import (
-	"github.com/pkg/errors"
+	"fmt"
+
+	"github.com/cortexproject/cortex/pkg/util"
+	"github.com/go-kit/kit/log/level"
 	"github.com/prometheus/prometheus/promql"
 )
 
@@ -76,7 +79,8 @@ func CanParallel(node promql.Node) bool {
 		return true
 
 	default:
-		panic(errors.Errorf("CanParallel: unhandled node type %T", node))
+		level.Error(util.Logger).Log("err", fmt.Sprintf("CanParallel: unhandled node type %T", node))
+		return false
 	}
 
 }
diff --git a/pkg/querier/astmapper/subtree_folder.go b/pkg/querier/astmapper/subtree_folder.go
index d8be4f28564..8eb66e25805 100644
--- a/pkg/querier/astmapper/subtree_folder.go
+++ b/pkg/querier/astmapper/subtree_folder.go
@@ -42,12 +42,12 @@ func (f *subtreeFolder) MapNode(node promql.Node) (promql.Node, bool, error) {
 func isEmbedded(node promql.Node) (bool, error) {
 	switch n := node.(type) {
 	case *promql.VectorSelector:
-		if n.Name == EmbeddedQueryFlag {
+		if n.Name == EmbeddedQueriesMetricName {
 			return true, nil
 		}
 
 	case *promql.MatrixSelector:
-		if n.Name == EmbeddedQueryFlag {
+		if n.Name == EmbeddedQueriesMetricName {
 			return true, nil
 		}
 
diff --git a/pkg/querier/queryrange/instrumentation.go b/pkg/querier/queryrange/instrumentation.go
index b73685d93c3..f40fd971dbc 100644
--- a/pkg/querier/queryrange/instrumentation.go
+++ b/pkg/querier/queryrange/instrumentation.go
@@ -25,7 +25,7 @@ var (
 	splitByCounter = promauto.NewCounter(prometheus.CounterOpts{
 		Namespace: "cortex",
 		Name:      "frontend_split_queries_total",
-		Help:      "Total number of split (parallelized) request segments",
+		Help:      "Total number of underlying query requests after the split by interval is applied",
 	})
 )
 
diff --git a/pkg/querier/queryrange/queryable.go b/pkg/querier/queryrange/queryable.go
index 2c5d6db02f0..e3881512b36 100644
--- a/pkg/querier/queryrange/queryable.go
+++ b/pkg/querier/queryrange/queryable.go
@@ -41,7 +41,7 @@ func (q *DownstreamQuerier) Select(
 	var embeddedQuery string
 	var isEmbedded bool
 	for _, matcher := range matchers {
-		if matcher.Name == labels.MetricName && matcher.Value == astmapper.EmbeddedQueryFlag {
+		if matcher.Name == labels.MetricName && matcher.Value == astmapper.EmbeddedQueriesMetricName {
 			isEmbedded = true
 		}
 
diff --git a/pkg/querier/queryrange/queryable_test.go b/pkg/querier/queryrange/queryable_test.go
index 5b42ec9fbf6..162ee210554 100644
--- a/pkg/querier/queryrange/queryable_test.go
+++ b/pkg/querier/queryrange/queryable_test.go
@@ -53,10 +53,12 @@ func TestSelect(t *testing.T) {
 					},
 				)
 
-				_, _, err := q.Select(
+				encoded, err := astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})
+				require.Nil(t, err)
+				_, _, err = q.Select(
 					nil,
-					exactMatch("__name__", astmapper.EmbeddedQueryFlag),
-					exactMatch(astmapper.QueryLabel, astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})),
+					exactMatch("__name__", astmapper.EmbeddedQueriesMetricName),
+					exactMatch(astmapper.QueryLabel, encoded),
 				)
 				require.Nil(t, err)
 			},
@@ -70,10 +72,12 @@ func TestSelect(t *testing.T) {
 				nil,
 			)),
 			fn: func(t *testing.T, q *DownstreamQuerier) {
+				encoded, err := astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})
+				require.Nil(t, err)
 				set, _, err := q.Select(
 					nil,
-					exactMatch("__name__", astmapper.EmbeddedQueryFlag),
-					exactMatch(astmapper.QueryLabel, astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})),
+					exactMatch("__name__", astmapper.EmbeddedQueriesMetricName),
+					exactMatch(astmapper.QueryLabel, encoded),
 				)
 				require.Nil(t, set)
 				require.EqualError(t, err, "SomeErr")
@@ -124,10 +128,12 @@ func TestSelect(t *testing.T) {
 				nil,
 			)),
 			fn: func(t *testing.T, q *DownstreamQuerier) {
+				encoded, err := astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})
+				require.Nil(t, err)
 				set, _, err := q.Select(
 					nil,
-					exactMatch("__name__", astmapper.EmbeddedQueryFlag),
-					exactMatch(astmapper.QueryLabel, astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})),
+					exactMatch("__name__", astmapper.EmbeddedQueriesMetricName),
+					exactMatch(astmapper.QueryLabel, encoded),
 				)
 				require.Nil(t, err)
 				require.Equal(
@@ -226,10 +232,12 @@ func TestSelectConcurrent(t *testing.T) {
 				},
 			}, c.err))
 
+			encoded, err := astmapper.JSONCodec.Encode(c.queries)
+			require.Nil(t, err)
 			set, _, err := querier.Select(
 				nil,
-				exactMatch("__name__", astmapper.EmbeddedQueryFlag),
-				exactMatch(astmapper.QueryLabel, astmapper.JSONCodec.Encode(c.queries)),
+				exactMatch("__name__", astmapper.EmbeddedQueriesMetricName),
+				exactMatch(astmapper.QueryLabel, encoded),
 			)
 
 			if c.err != nil {
diff --git a/pkg/querier/queryrange/querysharding.go b/pkg/querier/queryrange/querysharding.go
index 9ad17989a95..5ec6dbd86b7 100644
--- a/pkg/querier/queryrange/querysharding.go
+++ b/pkg/querier/queryrange/querysharding.go
@@ -140,7 +140,7 @@ func (ast *astMapperware) Do(ctx context.Context, r Request) (Response, error) {
 	conf, err := ast.confs.GetConf(r)
 	// cannot shard with this timerange
 	if err != nil {
-		level.Warn(ast.logger).Log("err", err.Error())
+		level.Warn(ast.logger).Log("err", err.Error(), "msg", "skipped AST mapper for request")
 		return ast.next.Do(ctx, r)
 	}
 
@@ -298,9 +298,7 @@ func partitionRequest(r Request, t time.Time) (before Request, after Request) {
 
 // TimeFromMillis is a helper to turn milliseconds -> time.Time
 func TimeFromMillis(ms int64) time.Time {
-	secs := ms / 1000
-	rem := ms - (secs * 1000)
-	return time.Unix(secs, rem*nanosecondsInMillisecond)
+	return time.Unix(0, ms*nanosecondsInMillisecond)
 }
 
 func TimeToMillis(t time.Time) int64 {
diff --git a/pkg/querier/queryrange/roundtrip.go b/pkg/querier/queryrange/roundtrip.go
index 08c81bb06ad..3f9143e38eb 100644
--- a/pkg/querier/queryrange/roundtrip.go
+++ b/pkg/querier/queryrange/roundtrip.go
@@ -36,10 +36,14 @@ import (
 
 const day = 24 * time.Hour
 
-// PassthroughMiddleware is a noop middleware
-var PassthroughMiddleware = MiddlewareFunc(func(next Handler) Handler {
-	return next
-})
+var (
+	// PassthroughMiddleware is a noop middleware
+	PassthroughMiddleware = MiddlewareFunc(func(next Handler) Handler {
+		return next
+	})
+
+	errInvalidMinShardingLookback = errors.New("a non-zero value is required for querier.query-ingesters-within when querier.sum-shards is enabled")
+)
 
 // Config for query_range middleware chain.
 type Config struct {
@@ -145,7 +149,7 @@ func NewTripperware(
 	if cfg.SumShards {
 
 		if minShardingLookback == 0 {
-			return nil, nil, errors.New("a non-zero value is required for querier.query-ingesters-within when querier.sum-shards is enabled")
+			return nil, nil, errInvalidMinShardingLookback
 		}
 
 		shardingware := NewQueryShardMiddleware(
diff --git a/pkg/querier/queryrange/roundtrip_test.go b/pkg/querier/queryrange/roundtrip_test.go
index 082cfdb3572..e3a892b57ec 100644
--- a/pkg/querier/queryrange/roundtrip_test.go
+++ b/pkg/querier/queryrange/roundtrip_test.go
@@ -118,5 +118,5 @@ func Test_ShardingConfigError(t *testing.T) {
 		0,
 	)
 
-	require.EqualError(t, err, "a non-zero value is required for querier.query-ingesters-within when querier.sum-shards is enabled")
+	require.EqualError(t, err, errInvalidMinShardingLookback.Error())
 }

From a309f6220ec36e5e5af7d7c2733d47459dafb8ff Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Thu, 20 Feb 2020 10:08:54 -0500
Subject: [PATCH 20/25] stylistic changes

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/chunk/schema.go                     |  3 +--
 pkg/chunk/series_store.go               |  1 -
 pkg/querier/astmapper/astmapper.go      |  4 ++--
 pkg/querier/astmapper/embedded.go       |  3 +--
 pkg/querier/astmapper/parallel.go       | 22 +++++++++---------
 pkg/querier/astmapper/parallel_test.go  |  4 ++--
 pkg/querier/astmapper/shard_summer.go   | 31 +++++++++++--------------
 pkg/querier/astmapper/subtree_folder.go |  4 ++--
 pkg/querier/queryrange/queryable.go     |  2 +-
 pkg/querier/queryrange/roundtrip.go     |  1 -
 pkg/querier/queryrange/value.go         |  1 -
 11 files changed, 34 insertions(+), 42 deletions(-)

diff --git a/pkg/chunk/schema.go b/pkg/chunk/schema.go
index 26f25d1f649..7a9441e0d73 100644
--- a/pkg/chunk/schema.go
+++ b/pkg/chunk/schema.go
@@ -5,9 +5,8 @@ import (
 	"encoding/hex"
 	"errors"
 	"fmt"
-	"strings"
-
 	"strconv"
+	"strings"
 
 	"github.com/go-kit/kit/log/level"
 	jsoniter "github.com/json-iterator/go"
diff --git a/pkg/chunk/series_store.go b/pkg/chunk/series_store.go
index a41f8ea4047..c4bb30518a5 100644
--- a/pkg/chunk/series_store.go
+++ b/pkg/chunk/series_store.go
@@ -537,7 +537,6 @@ func (c *seriesStore) calculateIndexEntries(ctx context.Context, from, through m
 
 func injectShardLabels(chunks []Chunk, shard astmapper.ShardAnnotation) {
 	for i, chunk := range chunks {
-
 		b := labels.NewBuilder(chunk.Metric)
 		l := shard.Label()
 		b.Set(l.Name, l.Value)
diff --git a/pkg/querier/astmapper/astmapper.go b/pkg/querier/astmapper/astmapper.go
index a93cd69161d..0263645294d 100644
--- a/pkg/querier/astmapper/astmapper.go
+++ b/pkg/querier/astmapper/astmapper.go
@@ -23,7 +23,7 @@ type MultiMapper struct {
 	mappers []ASTMapper
 }
 
-// Map impls ASTMapper
+// Map implements ASTMapper
 func (m *MultiMapper) Map(node promql.Node) (promql.Node, error) {
 	var result promql.Node = node
 	var err error
@@ -87,7 +87,7 @@ type ASTNodeMapper struct {
 	NodeMapper
 }
 
-// Map impls ASTMapper from a NodeMapper
+// Map implements ASTMapper from a NodeMapper
 func (nm ASTNodeMapper) Map(node promql.Node) (promql.Node, error) {
 	node, fin, err := nm.MapNode(node)
 
diff --git a/pkg/querier/astmapper/embedded.go b/pkg/querier/astmapper/embedded.go
index 645e4fc3866..fd448803b6f 100644
--- a/pkg/querier/astmapper/embedded.go
+++ b/pkg/querier/astmapper/embedded.go
@@ -30,7 +30,7 @@ type EmbeddedQueries struct {
 	Concat []string `json:"Concat"`
 }
 
-// JSONCodec is a Codec impl that uses JSON representations of EmbeddedQueries structs
+// JSONCodec is a Codec that uses JSON representations of EmbeddedQueries structs
 var JSONCodec jsonCodec
 
 type jsonCodec struct{}
@@ -70,7 +70,6 @@ func VectorSquasher(nodes ...promql.Node) (promql.Expr, error) {
 	}
 
 	embeddedQuery, err := labels.NewMatcher(labels.MatchEqual, QueryLabel, encoded)
-
 	if err != nil {
 		return nil, err
 	}
diff --git a/pkg/querier/astmapper/parallel.go b/pkg/querier/astmapper/parallel.go
index 1ee6fef0ed5..e14489083a6 100644
--- a/pkg/querier/astmapper/parallel.go
+++ b/pkg/querier/astmapper/parallel.go
@@ -23,9 +23,9 @@ var nonParallelFuncs = []string{
 	"absent",
 }
 
-// CanParallel tests if a subtree is parallelizable.
+// CanParallelize tests if a subtree is parallelizable.
 // A subtree is parallelizable if all of its components are parallelizable.
-func CanParallel(node promql.Node) bool {
+func CanParallelize(node promql.Node) bool {
 	switch n := node.(type) {
 	case nil:
 		// nil handles cases where we check optional fields that are not set
@@ -33,7 +33,7 @@ func CanParallel(node promql.Node) bool {
 
 	case promql.Expressions:
 		for _, e := range n {
-			if !CanParallel(e) {
+			if !CanParallelize(e) {
 				return false
 			}
 		}
@@ -41,7 +41,7 @@ func CanParallel(node promql.Node) bool {
 
 	case *promql.AggregateExpr:
 		_, ok := summableAggregates[n.Op]
-		return ok && CanParallel(n.Expr)
+		return ok && CanParallelize(n.Expr)
 
 	case *promql.BinaryExpr:
 		// since binary exprs use each side for merging, they cannot be parallelized
@@ -51,29 +51,29 @@ func CanParallel(node promql.Node) bool {
 		if n.Func == nil {
 			return false
 		}
-		if !ParallelFunc(*n.Func) {
+		if !ParallelizableFunc(*n.Func) {
 			return false
 		}
 
 		for _, e := range n.Args {
-			if !CanParallel(e) {
+			if !CanParallelize(e) {
 				return false
 			}
 		}
 		return true
 
 	case *promql.SubqueryExpr:
-		return CanParallel(n.Expr)
+		return CanParallelize(n.Expr)
 
 	case *promql.ParenExpr:
-		return CanParallel(n.Expr)
+		return CanParallelize(n.Expr)
 
 	case *promql.UnaryExpr:
 		// Since these are only currently supported for Scalars, should be parallel-compatible
 		return true
 
 	case *promql.EvalStmt:
-		return CanParallel(n.Expr)
+		return CanParallelize(n.Expr)
 
 	case *promql.MatrixSelector, *promql.NumberLiteral, *promql.StringLiteral, *promql.VectorSelector:
 		return true
@@ -85,8 +85,8 @@ func CanParallel(node promql.Node) bool {
 
 }
 
-// ParallelFunc ensures that a promql function can be part of a parallel query.
-func ParallelFunc(f promql.Function) bool {
+// ParallelizableFunc ensures that a promql function can be part of a parallel query.
+func ParallelizableFunc(f promql.Function) bool {
 
 	for _, v := range nonParallelFuncs {
 		if v == f.Name {
diff --git a/pkg/querier/astmapper/parallel_test.go b/pkg/querier/astmapper/parallel_test.go
index 890b9c34690..1ad07d39980 100644
--- a/pkg/querier/astmapper/parallel_test.go
+++ b/pkg/querier/astmapper/parallel_test.go
@@ -81,7 +81,7 @@ func TestCanParallel(t *testing.T) {
 
 	for i, c := range testExpr {
 		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
-			res := CanParallel(c.input)
+			res := CanParallelize(c.input)
 			require.Equal(t, c.expected, res)
 		})
 	}
@@ -112,7 +112,7 @@ func TestCanParallel_String(t *testing.T) {
 		t.Run(fmt.Sprintf("[%d]", i), func(t *testing.T) {
 			expr, err := promql.ParseExpr(c.input)
 			require.Nil(t, err)
-			res := CanParallel(expr)
+			res := CanParallelize(expr)
 			require.Equal(t, c.expected, res)
 		})
 	}
diff --git a/pkg/querier/astmapper/shard_summer.go b/pkg/querier/astmapper/shard_summer.go
index 533fc13eb20..c437f0ca231 100644
--- a/pkg/querier/astmapper/shard_summer.go
+++ b/pkg/querier/astmapper/shard_summer.go
@@ -2,12 +2,9 @@ package astmapper
 
 import (
 	"fmt"
-
 	"regexp"
-
-	"strings"
-
 	"strconv"
+	"strings"
 
 	"github.com/pkg/errors"
 	"github.com/prometheus/prometheus/pkg/labels"
@@ -29,28 +26,28 @@ var (
 type squasher = func(...promql.Node) (promql.Expr, error)
 
 type shardSummer struct {
-	shards   int
-	curshard *int
-	squash   squasher
+	shards       int
+	currentShard *int
+	squash       squasher
 }
 
-// NewShardSummer instantiates an ASTMapper which will fan out sums queries by shard
+// NewShardSummer instantiates an ASTMapper which will fan out sum queries by shard
 func NewShardSummer(shards int, squasher squasher) (ASTMapper, error) {
 	if squasher == nil {
 		return nil, errors.Errorf("squasher required and not passed")
 	}
 
 	return NewASTNodeMapper(&shardSummer{
-		shards:   shards,
-		squash:   squasher,
-		curshard: nil,
+		shards:       shards,
+		squash:       squasher,
+		currentShard: nil,
 	}), nil
 }
 
 // CopyWithCurShard clones a shardSummer with a new current shard.
 func (summer *shardSummer) CopyWithCurShard(curshard int) *shardSummer {
 	s := *summer
-	s.curshard = &curshard
+	s.currentShard = &curshard
 	return &s
 }
 
@@ -59,7 +56,7 @@ func (summer *shardSummer) MapNode(node promql.Node) (promql.Node, bool, error)
 
 	switch n := node.(type) {
 	case *promql.AggregateExpr:
-		if CanParallel(n) && n.Op == promql.SUM {
+		if CanParallelize(n) && n.Op == promql.SUM {
 			result, err := summer.shardSum(n)
 			return result, true, err
 		}
@@ -67,15 +64,15 @@ func (summer *shardSummer) MapNode(node promql.Node) (promql.Node, bool, error)
 		return n, false, nil
 
 	case *promql.VectorSelector:
-		if summer.curshard != nil {
-			mapped, err := shardVectorSelector(*summer.curshard, summer.shards, n)
+		if summer.currentShard != nil {
+			mapped, err := shardVectorSelector(*summer.currentShard, summer.shards, n)
 			return mapped, true, err
 		}
 		return n, true, nil
 
 	case *promql.MatrixSelector:
-		if summer.curshard != nil {
-			mapped, err := shardMatrixSelector(*summer.curshard, summer.shards, n)
+		if summer.currentShard != nil {
+			mapped, err := shardMatrixSelector(*summer.currentShard, summer.shards, n)
 			return mapped, true, err
 		}
 		return n, true, nil
diff --git a/pkg/querier/astmapper/subtree_folder.go b/pkg/querier/astmapper/subtree_folder.go
index 8eb66e25805..5d142bea116 100644
--- a/pkg/querier/astmapper/subtree_folder.go
+++ b/pkg/querier/astmapper/subtree_folder.go
@@ -18,7 +18,7 @@ func NewSubtreeFolder() ASTMapper {
 	return NewASTNodeMapper(&subtreeFolder{})
 }
 
-// MapNode impls NodeMapper
+// MapNode implements NodeMapper
 func (f *subtreeFolder) MapNode(node promql.Node) (promql.Node, bool, error) {
 	switch n := node.(type) {
 	// do not attempt to fold number or string leaf nodes
@@ -75,7 +75,7 @@ type visitor struct {
 	result bool
 }
 
-// Visit impls promql.Visitor
+// Visit implements promql.Visitor
 func (v *visitor) Visit(node promql.Node, path []promql.Node) (promql.Visitor, error) {
 	// if the visitor has already seen a predicate success, don't overwrite
 	if v.result {
diff --git a/pkg/querier/queryrange/queryable.go b/pkg/querier/queryrange/queryable.go
index e3881512b36..f655325ae33 100644
--- a/pkg/querier/queryrange/queryable.go
+++ b/pkg/querier/queryrange/queryable.go
@@ -21,7 +21,7 @@ type DownstreamQueryable struct {
 	Handler Handler
 }
 
-// Querier impls Queryable
+// Querier implements Queryable
 func (q *DownstreamQueryable) Querier(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
 	return &DownstreamQuerier{ctx, q.Req, q.Handler}, nil
 }
diff --git a/pkg/querier/queryrange/roundtrip.go b/pkg/querier/queryrange/roundtrip.go
index 3f9143e38eb..f70b00647ca 100644
--- a/pkg/querier/queryrange/roundtrip.go
+++ b/pkg/querier/queryrange/roundtrip.go
@@ -147,7 +147,6 @@ func NewTripperware(
 	}
 
 	if cfg.SumShards {
-
 		if minShardingLookback == 0 {
 			return nil, nil, errInvalidMinShardingLookback
 		}
diff --git a/pkg/querier/queryrange/value.go b/pkg/querier/queryrange/value.go
index ce3c0edcbe6..e8b8095ee2a 100644
--- a/pkg/querier/queryrange/value.go
+++ b/pkg/querier/queryrange/value.go
@@ -100,7 +100,6 @@ func ResponseToSamples(resp Response) ([]SampleStream, error) {
 
 // NewSeriesSet returns an in memory storage.SeriesSet from a []SampleStream
 func NewSeriesSet(results []SampleStream) storage.SeriesSet {
-
 	set := make([]storage.Series, 0, len(results))
 
 	for _, stream := range results {

From bc3f7f5cd05d0570b87080d1ad4369beeff3d12e Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Thu, 20 Feb 2020 10:15:51 -0500
Subject: [PATCH 21/25] s/downstream/sharded/

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 pkg/querier/astmapper/parallel.go        |  3 ++-
 pkg/querier/queryrange/queryable.go      | 22 +++++++++++-----------
 pkg/querier/queryrange/queryable_test.go | 16 ++++++++--------
 pkg/querier/queryrange/querysharding.go  |  2 +-
 4 files changed, 22 insertions(+), 21 deletions(-)

diff --git a/pkg/querier/astmapper/parallel.go b/pkg/querier/astmapper/parallel.go
index e14489083a6..d0fee3c430c 100644
--- a/pkg/querier/astmapper/parallel.go
+++ b/pkg/querier/astmapper/parallel.go
@@ -3,9 +3,10 @@ package astmapper
 import (
 	"fmt"
 
-	"github.com/cortexproject/cortex/pkg/util"
 	"github.com/go-kit/kit/log/level"
 	"github.com/prometheus/prometheus/promql"
+
+	"github.com/cortexproject/cortex/pkg/util"
 )
 
 var summableAggregates = map[promql.ItemType]struct{}{
diff --git a/pkg/querier/queryrange/queryable.go b/pkg/querier/queryrange/queryable.go
index f655325ae33..01ebe6b6865 100644
--- a/pkg/querier/queryrange/queryable.go
+++ b/pkg/querier/queryrange/queryable.go
@@ -15,26 +15,26 @@ const (
 	nonEmbeddedErrMsg       = "DownstreamQuerier cannot handle a non-embedded query"
 )
 
-// DownstreamQueryable is an implementor of the Queryable interface.
-type DownstreamQueryable struct {
+// ShardedQueryable is an implementor of the Queryable interface.
+type ShardedQueryable struct {
 	Req     Request
 	Handler Handler
 }
 
 // Querier implements Queryable
-func (q *DownstreamQueryable) Querier(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
-	return &DownstreamQuerier{ctx, q.Req, q.Handler}, nil
+func (q *ShardedQueryable) Querier(ctx context.Context, mint, maxt int64) (storage.Querier, error) {
+	return &ShardedQuerier{ctx, q.Req, q.Handler}, nil
 }
 
-// DownstreamQuerier is a an implementor of the Querier interface.
-type DownstreamQuerier struct {
+// ShardedQuerier is an implementor of the Querier interface.
+type ShardedQuerier struct {
 	Ctx     context.Context
 	Req     Request
 	Handler Handler
 }
 
 // Select returns a set of series that matches the given label matchers.
-func (q *DownstreamQuerier) Select(
+func (q *ShardedQuerier) Select(
 	_ *storage.SelectParams,
 	matchers ...*labels.Matcher,
 ) (storage.SeriesSet, storage.Warnings, error) {
@@ -62,7 +62,7 @@ func (q *DownstreamQuerier) Select(
 }
 
 // handleEmbeddedQuery defers execution of an encoded query to a downstream Handler
-func (q *DownstreamQuerier) handleEmbeddedQuery(encoded string) (storage.SeriesSet, storage.Warnings, error) {
+func (q *ShardedQuerier) handleEmbeddedQuery(encoded string) (storage.SeriesSet, storage.Warnings, error) {
 	queries, err := astmapper.JSONCodec.Decode(encoded)
 	if err != nil {
 		return nil, nil, err
@@ -106,16 +106,16 @@ func (q *DownstreamQuerier) handleEmbeddedQuery(encoded string) (storage.SeriesS
 }
 
 // LabelValues returns all potential values for a label name.
-func (q *DownstreamQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
+func (q *ShardedQuerier) LabelValues(name string) ([]string, storage.Warnings, error) {
 	return nil, nil, errors.Errorf("unimplemented")
 }
 
 // LabelNames returns all the unique label names present in the block in sorted order.
-func (q *DownstreamQuerier) LabelNames() ([]string, storage.Warnings, error) {
+func (q *ShardedQuerier) LabelNames() ([]string, storage.Warnings, error) {
 	return nil, nil, errors.Errorf("unimplemented")
 }
 
 // Close releases the resources of the Querier.
-func (q *DownstreamQuerier) Close() error {
+func (q *ShardedQuerier) Close() error {
 	return nil
 }
diff --git a/pkg/querier/queryrange/queryable_test.go b/pkg/querier/queryrange/queryable_test.go
index 162ee210554..36006c71195 100644
--- a/pkg/querier/queryrange/queryable_test.go
+++ b/pkg/querier/queryrange/queryable_test.go
@@ -16,15 +16,15 @@ import (
 func TestSelect(t *testing.T) {
 	var testExpr = []struct {
 		name    string
-		querier *DownstreamQuerier
-		fn      func(*testing.T, *DownstreamQuerier)
+		querier *ShardedQuerier
+		fn      func(*testing.T, *ShardedQuerier)
 	}{
 		{
 			name: "errors non embedded query",
 			querier: mkQuerier(
 				nil,
 			),
-			fn: func(t *testing.T, q *DownstreamQuerier) {
+			fn: func(t *testing.T, q *ShardedQuerier) {
 				set, _, err := q.Select(nil)
 				require.Nil(t, set)
 				require.EqualError(t, err, nonEmbeddedErrMsg)
@@ -36,7 +36,7 @@ func TestSelect(t *testing.T) {
 				&PrometheusResponse{},
 				nil,
 			)),
-			fn: func(t *testing.T, q *DownstreamQuerier) {
+			fn: func(t *testing.T, q *ShardedQuerier) {
 
 				expected := &PrometheusResponse{
 					Status: "success",
@@ -71,7 +71,7 @@ func TestSelect(t *testing.T) {
 				},
 				nil,
 			)),
-			fn: func(t *testing.T, q *DownstreamQuerier) {
+			fn: func(t *testing.T, q *ShardedQuerier) {
 				encoded, err := astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})
 				require.Nil(t, err)
 				set, _, err := q.Select(
@@ -127,7 +127,7 @@ func TestSelect(t *testing.T) {
 				},
 				nil,
 			)),
-			fn: func(t *testing.T, q *DownstreamQuerier) {
+			fn: func(t *testing.T, q *ShardedQuerier) {
 				encoded, err := astmapper.JSONCodec.Encode([]string{`http_requests_total{cluster="prod"}`})
 				require.Nil(t, err)
 				set, _, err := q.Select(
@@ -264,6 +264,6 @@ func exactMatch(k, v string) *labels.Matcher {
 
 }
 
-func mkQuerier(handler Handler) *DownstreamQuerier {
-	return &DownstreamQuerier{context.Background(), &PrometheusRequest{}, handler}
+func mkQuerier(handler Handler) *ShardedQuerier {
+	return &ShardedQuerier{context.Background(), &PrometheusRequest{}, handler}
 }
diff --git a/pkg/querier/queryrange/querysharding.go b/pkg/querier/queryrange/querysharding.go
index 5ec6dbd86b7..297c2fe39d3 100644
--- a/pkg/querier/queryrange/querysharding.go
+++ b/pkg/querier/queryrange/querysharding.go
@@ -185,7 +185,7 @@ func (qs *queryShard) Do(ctx context.Context, r Request) (Response, error) {
 		return qs.next.Do(ctx, r)
 	}
 
-	queryable := lazyquery.NewLazyQueryable(&DownstreamQueryable{r, qs.next})
+	queryable := lazyquery.NewLazyQueryable(&ShardedQueryable{r, qs.next})
 
 	qry, err := qs.engine.NewRangeQuery(
 		queryable,

From 1a159f06acab73cb21aee5648072bf0196672f0e Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Thu, 20 Feb 2020 10:39:29 -0500
Subject: [PATCH 22/25] s/sum_shards/parallelise_shardable_queries/

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 CHANGELOG.md                                | 2 +-
 docs/configuration/arguments.md             | 2 +-
 docs/configuration/config-file-reference.md | 6 +++---
 pkg/querier/queryrange/roundtrip.go         | 6 +++---
 pkg/querier/queryrange/roundtrip_test.go    | 2 +-
 5 files changed, 9 insertions(+), 9 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 09cdf7eb584..e8203a5a5c0 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -3,7 +3,7 @@
 ## master / unreleased
 
 * [FEATURE] Fan out parallelizable queries to backend queriers concurrently. #1878
-  * `-querier.sum-shards` (bool)
+  * `-querier.parallelise-shardable-queries` (bool)
   * Requires a shard-compatible schema (v10+)
   * This causes the number of traces to increase accordingly.
   * The query-frontend now requires a schema config to determine how/when to shard queries, either from a file or from flags (i.e. by the `config-yaml` CLI flag). This is the same schema config the queriers consume. The schema is only required to use this option.
diff --git a/docs/configuration/arguments.md b/docs/configuration/arguments.md
index 266c1b28059..94acfd86878 100644
--- a/docs/configuration/arguments.md
+++ b/docs/configuration/arguments.md
@@ -68,7 +68,7 @@ The ingester query API was improved over time, but defaults to the old behaviour
 
 ## Query Frontend
 
-- `-querier.sum-shards`
+- `-querier.parallelise-shardable-queries`
 
    If set to true, will cause the query frontend to mutate incoming queries when possible by turning `sum` operations into sharded `sum` operations. This requires a shard-compatible schema (v10+). An abridged example:
    `sum by (foo) (rate(bar{baz=”blip”}[1m]))` ->
diff --git a/docs/configuration/config-file-reference.md b/docs/configuration/config-file-reference.md
index 4b22c5b6f33..c60c1c84a63 100644
--- a/docs/configuration/config-file-reference.md
+++ b/docs/configuration/config-file-reference.md
@@ -642,9 +642,9 @@ results_cache:
 # CLI flag: -querier.max-retries-per-request
 [max_retries: <int> | default = 5]
 
-# Parse the ast and parallelize sums by shard.
-# CLI flag: -querier.sum-shards
-[sum_shards: <boolean> | default = false]
+# Perform query parallelisations based on storage sharding configuration and query ASTs.
+# CLI flag: -querier.parallelise-shardable-queries
+[parallelise_shardable_queries: <boolean> | default = false]
 ```
 
 ## `ruler_config`
diff --git a/pkg/querier/queryrange/roundtrip.go b/pkg/querier/queryrange/roundtrip.go
index f70b00647ca..1f43c7ef629 100644
--- a/pkg/querier/queryrange/roundtrip.go
+++ b/pkg/querier/queryrange/roundtrip.go
@@ -53,7 +53,7 @@ type Config struct {
 	ResultsCacheConfig     `yaml:"results_cache"`
 	CacheResults           bool `yaml:"cache_results"`
 	MaxRetries             int  `yaml:"max_retries"`
-	SumShards              bool `yaml:"sum_shards"`
+	ShardedQueries         bool `yaml:"parallelise_shardable_queries"`
 }
 
 // RegisterFlags adds the flags required to config this to the given FlagSet.
@@ -63,7 +63,7 @@ func (cfg *Config) RegisterFlags(f *flag.FlagSet) {
 	f.DurationVar(&cfg.SplitQueriesByInterval, "querier.split-queries-by-interval", 0, "Split queries by an interval and execute in parallel, 0 disables it. You should use an a multiple of 24 hours (same as the storage bucketing scheme), to avoid queriers downloading and processing the same chunks. This also determines how cache keys are chosen when result caching is enabled")
 	f.BoolVar(&cfg.AlignQueriesWithStep, "querier.align-querier-with-step", false, "Mutate incoming queries to align their start and end with their step.")
 	f.BoolVar(&cfg.CacheResults, "querier.cache-results", false, "Cache query results.")
-	f.BoolVar(&cfg.SumShards, "querier.sum-shards", false, "Parse the ast and parallelize sums by shard.")
+	f.BoolVar(&cfg.ShardedQueries, "querier.parallelise-shardable-queries", false, "Perform query parallelisations based on storage sharding configuration and query ASTs.")
 	cfg.ResultsCacheConfig.RegisterFlags(f)
 }
 
@@ -146,7 +146,7 @@ func NewTripperware(
 		queryRangeMiddleware = append(queryRangeMiddleware, InstrumentMiddleware("results_cache"), queryCacheMiddleware)
 	}
 
-	if cfg.SumShards {
+	if cfg.ShardedQueries {
 		if minShardingLookback == 0 {
 			return nil, nil, errInvalidMinShardingLookback
 		}
diff --git a/pkg/querier/queryrange/roundtrip_test.go b/pkg/querier/queryrange/roundtrip_test.go
index e3a892b57ec..e9423983c38 100644
--- a/pkg/querier/queryrange/roundtrip_test.go
+++ b/pkg/querier/queryrange/roundtrip_test.go
@@ -108,7 +108,7 @@ func (s singleHostRoundTripper) RoundTrip(r *http.Request) (*http.Response, erro
 
 func Test_ShardingConfigError(t *testing.T) {
 	_, _, err := NewTripperware(
-		Config{SumShards: true},
+		Config{ShardedQueries: true},
 		log.NewNopLogger(),
 		nil,
 		nil,

From 65718dbda4da05659aae5cf7117a8e3c06fe9872 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Thu, 20 Feb 2020 11:03:55 -0500
Subject: [PATCH 23/25] query-audit docs

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 docs/configuration/config-file-reference.md |   3 +-
 docs/operations/query-auditor.md            | 139 ++++++++++++++++++++
 2 files changed, 141 insertions(+), 1 deletion(-)
 create mode 100644 docs/operations/query-auditor.md

diff --git a/docs/configuration/config-file-reference.md b/docs/configuration/config-file-reference.md
index c60c1c84a63..5d4eddc2a73 100644
--- a/docs/configuration/config-file-reference.md
+++ b/docs/configuration/config-file-reference.md
@@ -642,7 +642,8 @@ results_cache:
 # CLI flag: -querier.max-retries-per-request
 [max_retries: <int> | default = 5]
 
-# Perform query parallelisations based on storage sharding configuration and query ASTs.
+# Perform query parallelisations based on storage sharding configuration and
+# query ASTs.
 # CLI flag: -querier.parallelise-shardable-queries
 [parallelise_shardable_queries: <boolean> | default = false]
 ```
diff --git a/docs/operations/query-auditor.md b/docs/operations/query-auditor.md
new file mode 100644
index 00000000000..6c23fbfa217
--- /dev/null
+++ b/docs/operations/query-auditor.md
@@ -0,0 +1,139 @@
+---
+title: "Query Auditor (tool)"
+linkTitle: "query auditor (tool)"
+weight: 1
+slug: query-auditor
+---
+
+The query auditor is a tool bundled in the cortex repo, but **not** included in docker images -- this must be built from source. It's primarily useful for those _developing_ cortex, but can be helpful to operators as well during certain scenarios (backend migrations come to mind).
+
+## How it works
+
+The `query-audit` tool performs a set of queries against two backends that expose the prometheus read API. This is generally the `query-frontend` component of two cortex deployments. It will then compare the differences in the responses to determine the average difference for each query. It does this by:
+ - Ensuring the resulting label sets match
+ - For each label set, ensuring they contain the same number of samples as their pair from the other backend
+ - For each sample, calculates their difference against it's pair from the other backend/label set.
+ - Calculates the average diff per query from the above diffs.
+
+### Limitations
+
+It currently only supports queries with `Matrix` response types, but should be simple to extend to `Vector`s as well, should the need arise.
+
+### Use cases
+
+- Correctness testing when working on the read path.
+- Comparing results from different backends.
+
+### Example Configuration
+
+```yaml
+control:
+  host: http://localhost:8080/api/prom
+  headers:
+    "X-Scope-OrgID": 1234
+
+test:
+  host: http://localhost:8081/api/prom
+  headers:
+    "X-Scope-OrgID": 1234
+
+queries:
+  - query: 'sum(rate(container_cpu_usage_seconds_total[5m]))'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-28T00:00:00Z
+    step_size: 15m
+  - query: 'sum(rate(container_cpu_usage_seconds_total[5m])) by (container_name)'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-28T00:00:00Z
+    step_size: 15m
+  - query: 'sum(rate(container_cpu_usage_seconds_total[5m])) without (container_name)'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-26T00:00:00Z
+    step_size: 15m
+  - query: 'histogram_quantile(0.9, sum(rate(cortex_cache_value_size_bytes_bucket[5m])) by (le, job))'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-25T06:00:00Z
+    step_size: 15m
+    # two shardable legs
+  - query: 'sum without (instance, job) (rate(cortex_query_frontend_queue_length[5m])) or sum by (job) (rate(cortex_query_frontend_queue_length[5m]))'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-25T06:00:00Z
+    step_size: 15m
+    # one shardable leg
+  - query: 'sum without (instance, job) (rate(cortex_cache_request_duration_seconds_count[5m])) or rate(cortex_cache_request_duration_seconds_count[5m])'
+    start: 2019-11-25T00:00:00Z
+    end: 2019-11-25T06:00:00Z
+    step_size: 15m
+```
+
+### Example Output
+
+Under ideal circumstances, you'll see output like the following:
+
+```
+$ go install ./tools/query-audit/ && query-audit -f ~/grafana/tmp/equivalence-config.yaml
+
+0.000000% avg diff for:
+        query: sum(rate(container_cpu_usage_seconds_total[5m]))
+        series: 1
+        samples: 289
+        start: 2019-11-25 00:00:00 +0000 UTC
+        end: 2019-11-28 00:00:00 +0000 UTC
+        step: 15m0s
+
+0.000000% avg diff for:
+        query: sum(rate(container_cpu_usage_seconds_total[5m])) by (container_name)
+        series: 95
+        samples: 25877
+        start: 2019-11-25 00:00:00 +0000 UTC
+        end: 2019-11-28 00:00:00 +0000 UTC
+        step: 15m0s
+
+0.000000% avg diff for:
+        query: sum(rate(container_cpu_usage_seconds_total[5m])) without (container_name)
+        series: 4308
+        samples: 374989
+        start: 2019-11-25 00:00:00 +0000 UTC
+        end: 2019-11-26 00:00:00 +0000 UTC
+        step: 15m0s
+
+0.000000% avg diff for:
+        query: histogram_quantile(0.9, sum(rate(cortex_cache_value_size_bytes_bucket[5m])) by (le, job))
+        series: 13
+        samples: 325
+        start: 2019-11-25 00:00:00 +0000 UTC
+        end: 2019-11-25 06:00:00 +0000 UTC
+        step: 15m0s
+
+0.000000% avg diff for:
+        query: sum without (instance, job) (rate(cortex_query_frontend_queue_length[5m])) or sum by (job) (rate(cortex_query_frontend_queue_length[5m]))
+        series: 21
+        samples: 525
+        start: 2019-11-25 00:00:00 +0000 UTC
+        end: 2019-11-25 06:00:00 +0000 UTC
+        step: 15m0s
+
+0.000000% avg diff for:
+        query: sum without (instance, job) (rate(cortex_cache_request_duration_seconds_count[5m])) or rate(cortex_cache_request_duration_seconds_count[5m])
+        series: 942
+        samples: 23550
+        start: 2019-11-25 00:00:00 +0000 UTC
+        end: 2019-11-25 06:00:00 +0000 UTC
+        step: 15m0s
+
+0.000000% avg diff for:
+        query: sum by (namespace) (predict_linear(container_cpu_usage_seconds_total[5m], 10))
+        series: 16
+        samples: 400
+        start: 2019-11-25 00:00:00 +0000 UTC
+        end: 2019-11-25 06:00:00 +0000 UTC
+        step: 15m0s
+
+0.000000% avg diff for:
+        query: sum by (namespace) (avg_over_time((rate(container_cpu_usage_seconds_total[5m]))[10m:]) > 1)
+        series: 4
+        samples: 52
+        start: 2019-11-25 00:00:00 +0000 UTC
+        end: 2019-11-25 01:00:00 +0000 UTC
+        step: 5m0s
+```

From 7e56489f1b9303ea22122c9de30a5b47c7475e2b Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Thu, 20 Feb 2020 11:24:44 -0500
Subject: [PATCH 24/25] notes sharded parallelizations are only supported by
 chunk store

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 docs/configuration/config-file-reference.md | 2 +-
 pkg/querier/queryrange/roundtrip.go         | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/configuration/config-file-reference.md b/docs/configuration/config-file-reference.md
index 5d4eddc2a73..1201fe0e839 100644
--- a/docs/configuration/config-file-reference.md
+++ b/docs/configuration/config-file-reference.md
@@ -643,7 +643,7 @@ results_cache:
 [max_retries: <int> | default = 5]
 
 # Perform query parallelisations based on storage sharding configuration and
-# query ASTs.
+# query ASTs. This feature is supported only by the chunks storage engine.
 # CLI flag: -querier.parallelise-shardable-queries
 [parallelise_shardable_queries: <boolean> | default = false]
 ```
diff --git a/pkg/querier/queryrange/roundtrip.go b/pkg/querier/queryrange/roundtrip.go
index 1f43c7ef629..505e6554a79 100644
--- a/pkg/querier/queryrange/roundtrip.go
+++ b/pkg/querier/queryrange/roundtrip.go
@@ -63,7 +63,7 @@ func (cfg *Config) RegisterFlags(f *flag.FlagSet) {
 	f.DurationVar(&cfg.SplitQueriesByInterval, "querier.split-queries-by-interval", 0, "Split queries by an interval and execute in parallel, 0 disables it. You should use an a multiple of 24 hours (same as the storage bucketing scheme), to avoid queriers downloading and processing the same chunks. This also determines how cache keys are chosen when result caching is enabled")
 	f.BoolVar(&cfg.AlignQueriesWithStep, "querier.align-querier-with-step", false, "Mutate incoming queries to align their start and end with their step.")
 	f.BoolVar(&cfg.CacheResults, "querier.cache-results", false, "Cache query results.")
-	f.BoolVar(&cfg.ShardedQueries, "querier.parallelise-shardable-queries", false, "Perform query parallelisations based on storage sharding configuration and query ASTs.")
+	f.BoolVar(&cfg.ShardedQueries, "querier.parallelise-shardable-queries", false, "Perform query parallelisations based on storage sharding configuration and query ASTs. This feature is supported only by the chunks storage engine.")
 	cfg.ResultsCacheConfig.RegisterFlags(f)
 }
 

From e6cb0b18e23e548e61c8fe4ee5b6df78d8b79ea9 Mon Sep 17 00:00:00 2001
From: Owen Diehl <ow.diehl@gmail.com>
Date: Thu, 20 Feb 2020 11:37:21 -0500
Subject: [PATCH 25/25] doc suggestions

Signed-off-by: Owen Diehl <ow.diehl@gmail.com>
---
 docs/operations/query-auditor.md | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/docs/operations/query-auditor.md b/docs/operations/query-auditor.md
index 6c23fbfa217..32828cef159 100644
--- a/docs/operations/query-auditor.md
+++ b/docs/operations/query-auditor.md
@@ -1,23 +1,24 @@
 ---
 title: "Query Auditor (tool)"
-linkTitle: "query auditor (tool)"
-weight: 1
+linkTitle: "Query Auditor (tool)"
+weight: 2
 slug: query-auditor
 ---
 
-The query auditor is a tool bundled in the cortex repo, but **not** included in docker images -- this must be built from source. It's primarily useful for those _developing_ cortex, but can be helpful to operators as well during certain scenarios (backend migrations come to mind).
+The query auditor is a tool bundled in the Cortex repository, but **not** included in Docker images; it must be built from source. It's primarily useful for those _developing_ Cortex, but can also be helpful to operators in certain scenarios (backend migrations come to mind).
 
 ## How it works
 
-The `query-audit` tool performs a set of queries against two backends that expose the prometheus read API. This is generally the `query-frontend` component of two cortex deployments. It will then compare the differences in the responses to determine the average difference for each query. It does this by:
- - Ensuring the resulting label sets match
- - For each label set, ensuring they contain the same number of samples as their pair from the other backend
+The `query-audit` tool performs a set of queries against two backends that expose the Prometheus read API. These are generally the `query-frontend` components of two Cortex deployments. It then compares the responses to determine the average difference for each query. It does this by:
+
+ - Ensuring the resulting label sets match.
+ - For each label set, ensuring they contain the same number of samples as their pair from the other backend.
  - For each sample, calculates their difference against it's pair from the other backend/label set.
  - Calculates the average diff per query from the above diffs.
 
 ### Limitations
 
-It currently only supports queries with `Matrix` response types, but should be simple to extend to `Vector`s as well, should the need arise.
+It currently only supports queries with `Matrix` response types.
 
 ### Use cases
 
@@ -71,7 +72,7 @@ queries:
 Under ideal circumstances, you'll see output like the following:
 
 ```
-$ go install ./tools/query-audit/ && query-audit -f ~/grafana/tmp/equivalence-config.yaml
+$ go run ./tools/query-audit/ -f config.yaml
 
 0.000000% avg diff for:
         query: sum(rate(container_cpu_usage_seconds_total[5m]))