|
| 1 | +//go:build requires_docker |
| 2 | +// +build requires_docker |
| 3 | + |
| 4 | +package integration |
| 5 | + |
| 6 | +import ( |
| 7 | + "testing" |
| 8 | + "time" |
| 9 | + |
| 10 | + "github.com/prometheus/common/model" |
| 11 | + "github.com/prometheus/prometheus/prompb" |
| 12 | + "github.com/stretchr/testify/require" |
| 13 | + |
| 14 | + "github.com/cortexproject/cortex/integration/e2e" |
| 15 | + e2edb "github.com/cortexproject/cortex/integration/e2e/db" |
| 16 | + "github.com/cortexproject/cortex/integration/e2ecortex" |
| 17 | +) |
| 18 | + |
| 19 | +func TestDistriubtorAcceptMixedHASamplesRunningInMicroservicesMode(t *testing.T) { |
| 20 | + const blockRangePeriod = 5 * time.Minute |
| 21 | + |
| 22 | + t.Run("Distributor accept mixed HA samples in the same request", func(t *testing.T) { |
| 23 | + s, err := e2e.NewScenario(networkName) |
| 24 | + require.NoError(t, err) |
| 25 | + defer s.Close() |
| 26 | + |
| 27 | + // Start dependencies. |
| 28 | + consul := e2edb.NewConsul() |
| 29 | + etcd := e2edb.NewETCD() |
| 30 | + minio := e2edb.NewMinio(9000, bucketName) |
| 31 | + require.NoError(t, s.StartAndWaitReady(consul, etcd, minio)) |
| 32 | + |
| 33 | + // Configure the querier to only look in ingester |
| 34 | + // and enbale distributor ha tracker with mixed samples. |
| 35 | + distributorFlags := map[string]string{ |
| 36 | + "-distributor.ha-tracker.enable": "true", |
| 37 | + "-distributor.ha-tracker.enable-for-all-users": "true", |
| 38 | + "-experimental.distributor.ha-tracker.mixed-ha-samples": "true", |
| 39 | + "-distributor.ha-tracker.cluster": "cluster", |
| 40 | + "-distributor.ha-tracker.replica": "__replica__", |
| 41 | + "-distributor.ha-tracker.store": "etcd", |
| 42 | + "-distributor.ha-tracker.etcd.endpoints": "etcd:2379", |
| 43 | + } |
| 44 | + querierFlags := mergeFlags(BlocksStorageFlags(), map[string]string{ |
| 45 | + "-querier.query-store-after": (1 * time.Hour).String(), |
| 46 | + }) |
| 47 | + flags := mergeFlags(BlocksStorageFlags(), map[string]string{ |
| 48 | + "-blocks-storage.tsdb.block-ranges-period": blockRangePeriod.String(), |
| 49 | + "-blocks-storage.tsdb.ship-interval": "5s", |
| 50 | + "-blocks-storage.tsdb.retention-period": ((blockRangePeriod * 2) - 1).String(), |
| 51 | + "-blocks-storage.bucket-store.max-chunk-pool-bytes": "1", |
| 52 | + }) |
| 53 | + |
| 54 | + // Start Cortex components. |
| 55 | + distributor := e2ecortex.NewDistributor("distributor", e2ecortex.RingStoreConsul, consul.NetworkHTTPEndpoint(), distributorFlags, "") |
| 56 | + ingester := e2ecortex.NewIngester("ingester", e2ecortex.RingStoreConsul, consul.NetworkHTTPEndpoint(), flags, "") |
| 57 | + require.NoError(t, s.StartAndWaitReady(distributor, ingester)) |
| 58 | + |
| 59 | + // Wait until both the distributor and ingester have updated the ring. |
| 60 | + require.NoError(t, distributor.WaitSumMetrics(e2e.Equals(512), "cortex_ring_tokens_total")) |
| 61 | + |
| 62 | + distributorClient, err := e2ecortex.NewClient(distributor.HTTPEndpoint(), "", "", "", "user-1") |
| 63 | + require.NoError(t, err) |
| 64 | + |
| 65 | + // Push some series to Cortex. |
| 66 | + series1Timestamp := time.Now() |
| 67 | + series2Timestamp := series1Timestamp.Add(-2 * time.Second) |
| 68 | + series3Timestamp := series1Timestamp.Add(-4 * time.Second) |
| 69 | + series4Timestamp := series1Timestamp.Add(-6 * time.Second) |
| 70 | + series5Timestamp := series1Timestamp.Add(-8 * time.Second) |
| 71 | + series6Timestamp := series1Timestamp.Add(-10 * time.Second) |
| 72 | + series7Timestamp := series1Timestamp.Add(-12 * time.Second) |
| 73 | + series1, _ := generateSeries("foo", series1Timestamp, prompb.Label{Name: "__replica__", Value: "replica0"}, prompb.Label{Name: "cluster", Value: "cluster0"}) |
| 74 | + series2, _ := generateSeries("foo", series2Timestamp, prompb.Label{Name: "__replica__", Value: "replica1"}, prompb.Label{Name: "cluster", Value: "cluster0"}) |
| 75 | + series3, _ := generateSeries("foo", series3Timestamp, prompb.Label{Name: "__replica__", Value: "replica0"}, prompb.Label{Name: "cluster", Value: "cluster1"}) |
| 76 | + series4, _ := generateSeries("foo", series4Timestamp, prompb.Label{Name: "__replica__", Value: "replica1"}, prompb.Label{Name: "cluster", Value: "cluster1"}) |
| 77 | + series5, _ := generateSeries("foo", series5Timestamp, prompb.Label{Name: "__replica__", Value: "replicaNoCluster"}) |
| 78 | + series6, _ := generateSeries("foo", series6Timestamp, prompb.Label{Name: "cluster", Value: "clusterNoReplica"}) |
| 79 | + series7, _ := generateSeries("foo", series7Timestamp, prompb.Label{Name: "other", Value: "label"}) |
| 80 | + |
| 81 | + res, err := distributorClient.Push([]prompb.TimeSeries{series1[0], series2[0], series3[0], series4[0], series5[0], series6[0], series7[0]}) |
| 82 | + require.NoError(t, err) |
| 83 | + require.Equal(t, 200, res.StatusCode) |
| 84 | + |
| 85 | + // Wait until the samples have been deduped. |
| 86 | + require.NoError(t, distributor.WaitSumMetrics(e2e.Equals(2), "cortex_distributor_deduped_samples_total")) |
| 87 | + require.NoError(t, distributor.WaitSumMetrics(e2e.Equals(3), "cortex_distributor_non_ha_samples_received_total")) |
| 88 | + |
| 89 | + // Start the querier and store-gateway, and configure them to frequently sync blocks fast enough to trigger consistency check. |
| 90 | + storeGateway := e2ecortex.NewStoreGateway("store-gateway", e2ecortex.RingStoreConsul, consul.NetworkHTTPEndpoint(), flags, "") |
| 91 | + querier := e2ecortex.NewQuerier("querier", e2ecortex.RingStoreConsul, consul.NetworkHTTPEndpoint(), mergeFlags(querierFlags, flags), "") |
| 92 | + require.NoError(t, s.StartAndWaitReady(querier, storeGateway)) |
| 93 | + |
| 94 | + // Wait until the querier and store-gateway have updated the ring, and wait until the blocks are old enough for consistency check |
| 95 | + require.NoError(t, querier.WaitSumMetrics(e2e.Equals(512*2), "cortex_ring_tokens_total")) |
| 96 | + require.NoError(t, storeGateway.WaitSumMetrics(e2e.Equals(512), "cortex_ring_tokens_total")) |
| 97 | + |
| 98 | + // Query back the series. |
| 99 | + querierClient, err := e2ecortex.NewClient("", querier.HTTPEndpoint(), "", "", "user-1") |
| 100 | + require.NoError(t, err) |
| 101 | + |
| 102 | + // Query back the series (only in the ingesters). |
| 103 | + result, err := querierClient.Query("foo[5m]", series1Timestamp) |
| 104 | + require.NoError(t, err) |
| 105 | + |
| 106 | + require.Equal(t, model.ValMatrix, result.Type()) |
| 107 | + m := result.(model.Matrix) |
| 108 | + require.Equal(t, 5, m.Len()) |
| 109 | + numValidHA := 0 |
| 110 | + numNonHA := 0 |
| 111 | + for _, ss := range m { |
| 112 | + replicaLabel, okReplica := ss.Metric["__replica__"] |
| 113 | + if okReplica { |
| 114 | + require.Equal(t, string(replicaLabel), "replicaNoCluster") |
| 115 | + } |
| 116 | + clusterLabel, okCluster := ss.Metric["cluster"] |
| 117 | + if okCluster { |
| 118 | + require.Equal(t, string(clusterLabel) == "cluster1" || string(clusterLabel) == "cluster0" || string(clusterLabel) == "clusterNoReplica", true) |
| 119 | + if clusterLabel == "cluster1" || clusterLabel == "cluster0" { |
| 120 | + numValidHA++ |
| 121 | + } |
| 122 | + } |
| 123 | + if (okReplica && !okCluster && replicaLabel == "replicaNoCluster") || (okCluster && !okReplica && clusterLabel == "clusterNoReplica") || (!okCluster && !okReplica) { |
| 124 | + numNonHA++ |
| 125 | + } |
| 126 | + require.NotEmpty(t, ss.Values) |
| 127 | + for _, v := range ss.Values { |
| 128 | + require.NotEmpty(t, v) |
| 129 | + } |
| 130 | + } |
| 131 | + require.Equal(t, numNonHA, 3) |
| 132 | + require.Equal(t, numValidHA, 2) |
| 133 | + |
| 134 | + // Ensure no service-specific metrics prefix is used by the wrong service. |
| 135 | + assertServiceMetricsPrefixes(t, Distributor, distributor) |
| 136 | + assertServiceMetricsPrefixes(t, Ingester, ingester) |
| 137 | + assertServiceMetricsPrefixes(t, StoreGateway, storeGateway) |
| 138 | + assertServiceMetricsPrefixes(t, Querier, querier) |
| 139 | + }) |
| 140 | +} |
0 commit comments