grafana · duricanikolic · Oct 12, 2023 · Oct 4, 2023 · Oct 4, 2023 · Oct 5, 2023
@@ -4,72 +4,239 @@ package ingester
 
 import (
 	"errors"
+	"fmt"
 	"net/http"
 	"testing"
 	"time"
 
 	"github.com/grafana/dskit/httpgrpc"
+	"github.com/grafana/dskit/services"
 	"github.com/prometheus/common/model"
 	"github.com/prometheus/prometheus/model/labels"
-	"github.com/stretchr/testify/assert"
 	"github.com/stretchr/testify/require"
 	"google.golang.org/grpc/codes"
 	"google.golang.org/grpc/status"
 
 	"github.com/grafana/mimir/pkg/mimirpb"
+	"github.com/grafana/mimir/pkg/util/globalerror"
+	"github.com/grafana/mimir/pkg/util/validation"
 )
 
 const (
 	timestamp = model.Time(1575043969)
 )
 
-func TestNewIngestErrMsgs(t *testing.T) {
-	metricLabelAdapters := []mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "test"}}
+// TestUnavailableError verifies the message and ingester error type of an unavailable error, bare and user-wrapped.
+func TestUnavailableError(t *testing.T) {
+	svcState := services.Starting
+	unavailableErr := newUnavailableError(svcState)
+	require.Error(t, unavailableErr)
+	require.EqualError(t, unavailableErr, fmt.Sprintf(integerUnavailableMsgFormat, svcState))
+	checkIngesterError(t, unavailableErr, unavailable)
+	// After wrapOrAnnotateWithUser the original error and its type must remain discoverable.
+	withUser := wrapOrAnnotateWithUser(unavailableErr, userID)
+	require.ErrorIs(t, withUser, unavailableErr)
+	require.ErrorAs(t, withUser, &unavailableError{})
+	checkIngesterError(t, withUser, unavailable)
+}
+
+// TestInstanceLimitReachedError verifies the message and error type of an instance-limit error, bare and user-wrapped.
+func TestInstanceLimitReachedError(t *testing.T) {
+	const limitMsg = "this is a limit error message"
+	limitErr := newInstanceLimitReachedError(limitMsg)
+	require.Error(t, limitErr)
+	require.EqualError(t, limitErr, limitMsg)
+	checkIngesterError(t, limitErr, instanceLimitReached)
+	withUser := wrapOrAnnotateWithUser(limitErr, userID)
+	require.ErrorIs(t, withUser, limitErr)
+	require.ErrorAs(t, withUser, &instanceLimitReachedError{})
+	checkIngesterError(t, withUser, instanceLimitReached)
+}
+
+// TestNewTSDBUnavailableError verifies the message and tsdbUnavailable type of the error: bare, %w-wrapped and user-wrapped.
+func TestNewTSDBUnavailableError(t *testing.T) {
+	tsdbErrMsg := "TSDB Head forced compaction in progress and no write request is currently allowed"
+	err := newTSDBUnavailableError(tsdbErrMsg)
+	require.Error(t, err)
+	require.EqualError(t, err, tsdbErrMsg)
+	checkIngesterError(t, err, tsdbUnavailable)
+	wrappedErr := fmt.Errorf("wrapped: %w", err)
+	require.ErrorIs(t, wrappedErr, err)
+	require.ErrorAs(t, wrappedErr, &tsdbUnavailableError{})
+	checkIngesterError(t, wrappedErr, tsdbUnavailable) // type must survive plain %w wrapping
+	wrappedWithUserErr := wrapOrAnnotateWithUser(err, userID)
+	require.ErrorIs(t, wrappedWithUserErr, err)
+	require.ErrorAs(t, wrappedWithUserErr, &tsdbUnavailableError{})
+	checkIngesterError(t, wrappedWithUserErr, tsdbUnavailable) // and wrapping with the user ID
+}
+
+// TestNewPerUserSeriesLimitError verifies the message and badData type of a per-user series limit error, bare and user-wrapped.
+func TestNewPerUserSeriesLimitError(t *testing.T) {
+	seriesLimit := 100
+	wantMsg := globalerror.MaxSeriesPerUser.MessageWithPerTenantLimitConfig(
+		fmt.Sprintf("per-user series limit of %d exceeded", seriesLimit),
+		validation.MaxSeriesPerUserFlag,
+	)
+	limitErr := newPerUserSeriesLimitReachedError(seriesLimit)
+	require.Equal(t, wantMsg, limitErr.Error())
+	checkIngesterError(t, limitErr, badData)
+	withUser := wrapOrAnnotateWithUser(limitErr, userID)
+	require.ErrorIs(t, withUser, limitErr)
+	require.ErrorAs(t, withUser, &perUserSeriesLimitReachedError{})
+	checkIngesterError(t, withUser, badData)
+}
+
+// TestNewPerUserMetadataLimitError verifies the message and badData type of a per-user metadata limit error, bare and user-wrapped.
+func TestNewPerUserMetadataLimitError(t *testing.T) {
+	metadataLimit := 100
+	wantMsg := globalerror.MaxMetadataPerUser.MessageWithPerTenantLimitConfig(
+		fmt.Sprintf("per-user metric metadata limit of %d exceeded", metadataLimit),
+		validation.MaxMetadataPerUserFlag,
+	)
+	limitErr := newPerUserMetadataLimitReachedError(metadataLimit)
+	require.Equal(t, wantMsg, limitErr.Error())
+	checkIngesterError(t, limitErr, badData)
+	withUser := wrapOrAnnotateWithUser(limitErr, userID)
+	require.ErrorIs(t, withUser, limitErr)
+	require.ErrorAs(t, withUser, &perUserMetadataLimitReachedError{})
+	checkIngesterError(t, withUser, badData)
+}
+
+// TestNewPerMetricSeriesLimitError verifies the message and badData type of a per-metric series limit error, bare and user-wrapped.
+func TestNewPerMetricSeriesLimitError(t *testing.T) {
+	seriesLimit := 100
+	seriesLabels := mimirpb.FromLabelAdaptersToLabels(
+		[]mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "testmetric"}, {Name: "foo", Value: "biz"}},
+	)
+	limitErr := newPerMetricSeriesLimitReachedError(seriesLimit, seriesLabels)
+	limitMsg := globalerror.MaxSeriesPerMetric.MessageWithPerTenantLimitConfig(
+		fmt.Sprintf("per-metric series limit of %d exceeded", seriesLimit),
+		validation.MaxSeriesPerMetricFlag,
+	)
+	wantMsg := fmt.Sprintf("%s This is for series %s", limitMsg, seriesLabels.String())
+	require.Equal(t, wantMsg, limitErr.Error())
+	checkIngesterError(t, limitErr, badData)
+
+	// The user-wrapped error must still match the original and report badData.
+	withUser := wrapOrAnnotateWithUser(limitErr, userID)
+	require.ErrorIs(t, withUser, limitErr)
+	require.ErrorAs(t, withUser, &perMetricSeriesLimitReachedError{})
+	checkIngesterError(t, withUser, badData)
+}
+
+// TestNewPerMetricMetadataLimitError verifies the message and badData type of a per-metric metadata limit error, bare and user-wrapped.
+func TestNewPerMetricMetadataLimitError(t *testing.T) {
+	metadataLimit := 100
+	seriesLabels := mimirpb.FromLabelAdaptersToLabels(
+		[]mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "testmetric"}, {Name: "foo", Value: "biz"}},
+	)
+	limitErr := newPerMetricMetadataLimitReachedError(metadataLimit, seriesLabels)
+	limitMsg := globalerror.MaxMetadataPerMetric.MessageWithPerTenantLimitConfig(
+		fmt.Sprintf("per-metric metadata limit of %d exceeded", metadataLimit),
+		validation.MaxMetadataPerMetricFlag,
+	)
+	wantMsg := fmt.Sprintf("%s This is for series %s", limitMsg, seriesLabels.String())
+	require.Equal(t, wantMsg, limitErr.Error())
+	checkIngesterError(t, limitErr, badData)
+
+	// The user-wrapped error must still match the original and report badData.
+	withUser := wrapOrAnnotateWithUser(limitErr, userID)
+	require.ErrorIs(t, withUser, limitErr)
+	require.ErrorAs(t, withUser, &perMetricMetadataLimitReachedError{})
+	checkIngesterError(t, withUser, badData)
+}
+
+func TestNewSampleError(t *testing.T) {
+	seriesLabels := []mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "test"}}
 	tests := map[string]struct {
-		err error
-		msg string
+		err         error
+		expectedMsg string
 	}{
-		"newIngestErrSampleTimestampTooOld": {
-			err: newIngestErrSampleTimestampTooOld(timestamp, metricLabelAdapters),
-			msg: `the sample has been rejected because its timestamp is too old (err-mimir-sample-timestamp-too-old). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
+		"newSampleTimestampTooOldError": {
+			err:         newSampleTimestampTooOldError(timestamp, seriesLabels),
+			expectedMsg: `the sample has been rejected because its timestamp is too old (err-mimir-sample-timestamp-too-old). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
 		},
-		"newIngestErrSampleTimestampTooOld_out_of_order_enabled": {
-			err: newIngestErrSampleTimestampTooOldOOOEnabled(timestamp, metricLabelAdapters, 2*time.Hour),
-			msg: `the sample has been rejected because another sample with a more recent timestamp has already been ingested and this sample is beyond the out-of-order time window of 2h (err-mimir-sample-timestamp-too-old). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
+		"newSampleTimestampTooOldOOOEnabledError": {
+			err:         newSampleTimestampTooOldOOOEnabledError(timestamp, seriesLabels, 2*time.Hour),
+			expectedMsg: `the sample has been rejected because another sample with a more recent timestamp has already been ingested and this sample is beyond the out-of-order time window of 2h (err-mimir-sample-timestamp-too-old). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
 		},
-		"newIngestErrSampleOutOfOrder": {
-			err: newIngestErrSampleOutOfOrder(timestamp, metricLabelAdapters),
-			msg: `the sample has been rejected because another sample with a more recent timestamp has already been ingested and out-of-order samples are not allowed (err-mimir-sample-out-of-order). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
+		"newSampleTimestampTooFarInFutureError": {
+			err:         newSampleTimestampTooFarInFutureError(timestamp, seriesLabels),
+			expectedMsg: `received a sample whose timestamp is too far in the future (err-mimir-too-far-in-future). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
 		},
-		"newIngestErrSampleDuplicateTimestamp": {
-			err: newIngestErrSampleDuplicateTimestamp(timestamp, metricLabelAdapters),
-			msg: `the sample has been rejected because another sample with the same timestamp, but a different value, has already been ingested (err-mimir-sample-duplicate-timestamp). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
+		"newSampleOutOfOrderError": {
+			err:         newSampleOutOfOrderError(timestamp, seriesLabels),
+			expectedMsg: `the sample has been rejected because another sample with a more recent timestamp has already been ingested and out-of-order samples are not allowed (err-mimir-sample-out-of-order). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
 		},
-		"newIngestErrExemplarMissingSeries": {
-			err: newIngestErrExemplarMissingSeries(timestamp, metricLabelAdapters, []mimirpb.LabelAdapter{{Name: "traceID", Value: "123"}}),
-			msg: `the exemplar has been rejected because the related series has not been ingested yet (err-mimir-exemplar-series-missing). The affected exemplar is {traceID="123"} with timestamp 1970-01-19T05:30:43.969Z for series {__name__="test"}`,
+		"newSampleDuplicateTimestampError": {
+			err:         newSampleDuplicateTimestampError(timestamp, seriesLabels),
+			expectedMsg: `the sample has been rejected because another sample with the same timestamp, but a different value, has already been ingested (err-mimir-sample-duplicate-timestamp). The affected sample has timestamp 1970-01-19T05:30:43.969Z and is from series {__name__="test"}`,
 		},
 	}
 
 	for testName, tc := range tests {
 		t.Run(testName, func(t *testing.T) {
-			assert.Equal(t, tc.msg, tc.err.Error())
-			var safe safeToWrap
-			assert.ErrorAs(t, tc.err, &safe)
+			require.Equal(t, tc.expectedMsg, tc.err.Error())
+			checkIngesterError(t, tc.err, badData)
+			// The user-wrapped error must still match as a sampleError and report badData.
+			wrappedErr := wrapOrAnnotateWithUser(tc.err, userID)
+			require.ErrorIs(t, wrappedErr, tc.err)
+			var sampleErr sampleError
+			require.ErrorAs(t, wrappedErr, &sampleErr)
+			checkIngesterError(t, wrappedErr, badData)
 		})
 	}
 }
 
-func TestSafeToWrapError(t *testing.T) {
-	err := safeToWrapError("this is a safe to wrap error")
-	require.Error(t, err)
-	var safe safeToWrap
-	require.ErrorAs(t, err, &safe)
+// TestNewExemplarError verifies the message and badData type of each exemplar error constructor, bare and user-wrapped.
+func TestNewExemplarError(t *testing.T) {
+	series := []mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "test"}}
+	exemplar := []mimirpb.LabelAdapter{{Name: "traceID", Value: "123"}}
+	cases := map[string]struct {
+		err     error
+		wantMsg string
+	}{
+		"newExemplarMissingSeriesError": {
+			err:     newExemplarMissingSeriesError(timestamp, series, exemplar),
+			wantMsg: `the exemplar has been rejected because the related series has not been ingested yet (err-mimir-exemplar-series-missing). The affected exemplar is {traceID="123"} with timestamp 1970-01-19T05:30:43.969Z for series {__name__="test"}`,
+		},
+		"newExemplarTimestampTooFarInFutureError": {
+			err:     newExemplarTimestampTooFarInFutureError(timestamp, series, exemplar),
+			wantMsg: `received an exemplar whose timestamp is too far in the future (err-mimir-exemplar-too-far-in-future). The affected exemplar is {traceID="123"} with timestamp 1970-01-19T05:30:43.969Z for series {__name__="test"}`,
+		},
+	}
+	for name, tc := range cases {
+		t.Run(name, func(t *testing.T) {
+			require.Equal(t, tc.wantMsg, tc.err.Error())
+			checkIngesterError(t, tc.err, badData)
+			// The user-wrapped error must still match as an exemplarError and report badData.
+			withUser := wrapOrAnnotateWithUser(tc.err, userID)
+			require.ErrorIs(t, withUser, tc.err)
+			var asExemplar exemplarError
+			require.ErrorAs(t, withUser, &asExemplar)
+			checkIngesterError(t, withUser, badData)
+		})
+	}
+}
+
+// TestNewTSDBIngestExemplarErr verifies the message and badData type of a TSDB exemplar ingestion error, bare and user-wrapped.
+func TestNewTSDBIngestExemplarErr(t *testing.T) {
+	series := []mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "test"}}
+	exemplar := []mimirpb.LabelAdapter{{Name: "traceID", Value: "123"}}
+	cause := errors.New("another error")
+	ingestErr := newTSDBIngestExemplarErr(cause, timestamp, series, exemplar)
+	wantMsg := fmt.Sprintf("err: %v. timestamp=1970-01-19T05:30:43.969Z, series={__name__=\"test\"}, exemplar={traceID=\"123\"}", cause)
+	require.Equal(t, wantMsg, ingestErr.Error())
+	checkIngesterError(t, ingestErr, badData)
+	withUser := wrapOrAnnotateWithUser(ingestErr, userID)
+	require.ErrorIs(t, withUser, ingestErr)
+	require.ErrorAs(t, withUser, &tsdbIngestExemplarErr{})
+	checkIngesterError(t, withUser, badData)
 }
 
 func TestErrorWithStatus(t *testing.T) {
 	metricLabelAdapters := []mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "test"}}
-	err := newIngestErrSampleTimestampTooOld(timestamp, metricLabelAdapters)
+	err := newSampleTimestampTooOldError(timestamp, metricLabelAdapters)
 	errWithStatus := newErrorWithStatus(err, codes.Unavailable)
 	require.Error(t, errWithStatus)
 	stat, ok := status.FromError(errWithStatus)
@@ -81,7 +248,7 @@ func TestErrorWithStatus(t *testing.T) {
 
 func TestErrorWithHTTPStatus(t *testing.T) {
 	metricLabelAdapters := []mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "test"}}
-	err := newIngestErrSampleTimestampTooOld(timestamp, metricLabelAdapters)
+	err := newSampleTimestampTooOldError(timestamp, metricLabelAdapters)
 	errWithHTTPStatus := newErrorWithHTTPStatus(err, http.StatusBadRequest)
 	require.Error(t, errWithHTTPStatus)
 	stat, ok := status.FromError(errWithHTTPStatus)
@@ -97,15 +264,33 @@ func TestErrorWithHTTPStatus(t *testing.T) {
 
+// TestWrapOrAnnotateWithUser covers both outcomes of wrapOrAnnotateWithUser: an
+// error that is only annotated with the user ID, and one that is wrapped.
 func TestWrapOrAnnotateWithUser(t *testing.T) {
 	userID := "1"
-	unsafeErr := errors.New("this is an unsafe error")
-	safeErr := safeToWrapError("this is a safe error")
-
-	annotatedUnsafeErr := wrapOrAnnotateWithUser(unsafeErr, userID)
+	// A plain error gets the user prefix but cannot be unwrapped back to the original.
+	annotatingErr := errors.New("this error will be annotated")
+	expectedAnnotatedErrMsg := fmt.Sprintf("user=%s: %s", userID, annotatingErr.Error())
+	annotatedUnsafeErr := wrapOrAnnotateWithUser(annotatingErr, userID)
 	require.Error(t, annotatedUnsafeErr)
-	require.NotErrorIs(t, annotatedUnsafeErr, unsafeErr)
+	require.EqualError(t, annotatedUnsafeErr, expectedAnnotatedErrMsg)
+	require.NotErrorIs(t, annotatedUnsafeErr, annotatingErr)
 	require.Nil(t, errors.Unwrap(annotatedUnsafeErr))
 
-	wrappedSafeErr := wrapOrAnnotateWithUser(safeErr, userID)
+	// A sample error gets the same prefix and stays reachable through Unwrap.
+	metricLabelAdapters := []mimirpb.LabelAdapter{{Name: labels.MetricName, Value: "test"}}
+	wrappingErr := newSampleTimestampTooOldError(timestamp, metricLabelAdapters)
+	expectedWrappedErrMsg := fmt.Sprintf("user=%s: %s", userID, wrappingErr.Error())
+	wrappedSafeErr := wrapOrAnnotateWithUser(wrappingErr, userID)
 	require.Error(t, wrappedSafeErr)
-	require.ErrorIs(t, wrappedSafeErr, safeErr)
+	require.EqualError(t, wrappedSafeErr, expectedWrappedErrMsg)
+	require.ErrorIs(t, wrappedSafeErr, wrappingErr)
+	require.Equal(t, wrappingErr, errors.Unwrap(wrappedSafeErr))
+}
+
+// checkIngesterError asserts that err's chain contains an ingesterError whose
+// errorType() equals expectedType.
+func checkIngesterError(t *testing.T, err error, expectedType ingesterErrorType) {
+	t.Helper() // report failures at the calling test's line, not inside this helper
+	var ingesterErr ingesterError
+	require.ErrorAs(t, err, &ingesterErr)
+	require.Equal(t, expectedType, ingesterErr.errorType())
 }