From b323f6bb1f76755ac59a2195f7f616bb50b21743 Mon Sep 17 00:00:00 2001
From: Chetany Bhardwaj <chetanyiot@gmail.com>
Date: Thu, 21 May 2026 14:41:50 +0530
Subject: [PATCH 1/8] feat: add check_http_metrics task for metric testing

---
 go.mod                                 |   8 +-
 pkg/tasks/check_http_metrics/config.go | 234 ++++++++++
 pkg/tasks/check_http_metrics/task.go   | 586 +++++++++++++++++++++++++
 3 files changed, 824 insertions(+), 4 deletions(-)
 create mode 100644 pkg/tasks/check_http_metrics/config.go
 create mode 100644 pkg/tasks/check_http_metrics/task.go

diff --git a/go.mod b/go.mod
index da345659..fa157225 100644
--- a/go.mod
+++ b/go.mod
@@ -4,6 +4,7 @@ go 1.25.7
 
 require (
 	github.com/donovanhide/eventsource v0.0.0-20210830082556-c59027999da0
+	github.com/dustin/go-humanize v1.0.1
 	github.com/ethereum/go-ethereum v1.17.3-0.20260421080339-499762852cf2
 	github.com/ethpandaops/ethwallclock v0.4.0
 	github.com/ethpandaops/go-eth2-client v0.1.2
@@ -23,10 +24,13 @@ require (
 	github.com/mashingan/smapping v0.1.19
 	github.com/pressly/goose/v3 v3.27.1
 	github.com/prometheus/client_golang v1.23.2
+	github.com/prometheus/client_model v0.6.2
+	github.com/prometheus/common v0.66.1
 	github.com/protolambda/zrnt v0.34.1
 	github.com/protolambda/ztyp v0.2.2
 	github.com/prysmaticlabs/go-bitfield v0.0.0-20240618144021-706c95b2dd15
 	github.com/rs/zerolog v1.35.1
+	github.com/santhosh-tekuri/jsonschema/v5 v5.3.1
 	github.com/sirupsen/logrus v1.9.4
 	github.com/spf13/cobra v1.10.2
 	github.com/spf13/pflag v1.0.10
@@ -57,7 +61,6 @@ require (
 	github.com/crate-crypto/go-eth-kzg v1.5.0 // indirect
 	github.com/deckarep/golang-set/v2 v2.6.0 // indirect
 	github.com/decred/dcrd/dcrec/secp256k1/v4 v4.3.0 // indirect
-	github.com/dustin/go-humanize v1.0.1 // indirect
 	github.com/emicklei/dot v1.6.4 // indirect
 	github.com/ethereum/c-kzg-4844/v2 v2.1.6 // indirect
 	github.com/ferranbt/fastssz v0.1.4 // indirect
@@ -89,13 +92,10 @@ require (
 	github.com/pk910/dynamic-ssz v1.3.2-0.20260505131440-111bcb265c8f // indirect
 	github.com/pk910/hashtree-bindings v0.1.0 // indirect
 	github.com/pkg/errors v0.9.1 // indirect
-	github.com/prometheus/client_model v0.6.2 // indirect
-	github.com/prometheus/common v0.66.1 // indirect
 	github.com/prometheus/procfs v0.20.1 // indirect
 	github.com/protolambda/bls12-381-util v0.1.0 // indirect
 	github.com/r3labs/sse/v2 v2.10.0 // indirect
 	github.com/remyoudompheng/bigfft v0.0.0-20230129092748-24d4a6f8daec // indirect
-	github.com/santhosh-tekuri/jsonschema/v5 v5.3.1 // indirect
 	github.com/sethvargo/go-retry v0.3.0 // indirect
 	github.com/shirou/gopsutil v3.21.11+incompatible // indirect
 	github.com/supranational/blst v0.3.16 // indirect
diff --git a/pkg/tasks/check_http_metrics/config.go b/pkg/tasks/check_http_metrics/config.go
new file mode 100644
index 00000000..84c67a7c
--- /dev/null
+++ b/pkg/tasks/check_http_metrics/config.go
@@ -0,0 +1,234 @@
+package checkhttpmetrics
+
+import (
+	"fmt"
+	"math"
+	"time"
+
+	"github.com/dustin/go-humanize"
+	"github.com/ethpandaops/assertoor/pkg/helper"
+)
+
+// MissingBehavior controls what happens when a metric or series cannot be found.
+// "wait" keeps polling, "fail" marks the assertion as failed, "pass" treats it as passed.
+type MissingBehavior string
+
+const (
+	MissingBehaviorWait MissingBehavior = "wait"
+	MissingBehaviorFail MissingBehavior = "fail"
+	MissingBehaviorPass MissingBehavior = "pass"
+
+	// DefaultMaxResponseSize is the default maximum response body size for metrics scraping.
+	DefaultMaxResponseSize = "10MB"
+)
+
+// ResetBehavior controls what happens when a counter value drops below its baseline,
+// which typically indicates a service restart or counter reset.
+type ResetBehavior string
+
+const (
+	ResetBehaviorFail       ResetBehavior = "fail"
+	ResetBehaviorRebaseline ResetBehavior = "rebaseline"
+	ResetBehaviorIgnore     ResetBehavior = "ignore"
+)
+
+// AssertionMode determines whether to compare the raw metric value or the change since baseline.
+// Delta mode requires at least two scrapes: one to record baseline, one to evaluate.
+type AssertionMode string
+
+const (
+	AssertionModeValue AssertionMode = "value"
+	AssertionModeDelta AssertionMode = "delta"
+)
+
+// Operator specifies the comparison operation between actual and expected values.
+type Operator string
+
+const (
+	OperatorEq  Operator = "eq"
+	OperatorNeq Operator = "neq"
+	OperatorGt  Operator = "gt"
+	OperatorGte Operator = "gte"
+	OperatorLt  Operator = "lt"
+	OperatorLte Operator = "lte"
+)
+
+// AssertionConfig defines a single metric assertion to evaluate.
+// Labels must match exactly one time series; matching zero or multiple series is an error.
+type AssertionConfig struct {
+	Name          string            `yaml:"name" json:"name" desc:"Unique human-readable assertion name."`
+	Metric        string            `yaml:"metric" json:"metric" desc:"Prometheus metric name."`
+	Labels        map[string]string `yaml:"labels" json:"labels" desc:"Exact label match for the time series."`
+	Mode          AssertionMode     `yaml:"mode" json:"mode" desc:"Evaluation mode: 'value' (current value) or 'delta' (change since baseline)."`
+	Operator      Operator          `yaml:"operator" json:"operator" desc:"Comparison operator: eq, neq, gt, gte, lt, lte."`
+	Value         float64           `yaml:"value" json:"value" desc:"Expected value for comparison."`
+	MissingMetric *MissingBehavior  `yaml:"missingMetric" json:"missingMetric,omitempty" desc:"Override global missingMetric behavior for this assertion."`
+	MissingSeries *MissingBehavior  `yaml:"missingSeries" json:"missingSeries,omitempty" desc:"Override global missingSeries behavior for this assertion."`
+}
+
+// Config holds the task configuration for scraping a Prometheus metrics endpoint
+// and evaluating assertions against the scraped values.
+type Config struct {
+	URL             string            `yaml:"url" json:"url" desc:"HTTP URL of the Prometheus metrics endpoint."`
+	Headers         map[string]string `yaml:"headers" json:"headers" desc:"Optional HTTP request headers."`
+	PollInterval    helper.Duration   `yaml:"pollInterval" json:"pollInterval" desc:"Interval between metric scrapes."`
+	RequestTimeout  helper.Duration   `yaml:"requestTimeout" json:"requestTimeout" desc:"Timeout for a single HTTP request."`
+	MaxResponseSize string            `yaml:"maxResponseSize" json:"maxResponseSize" desc:"Maximum response body size (e.g., '10MB')."`
+	FailOnCheckMiss bool              `yaml:"failOnCheckMiss" json:"failOnCheckMiss" desc:"If true, fail immediately when assertions are not met."`
+	ContinueOnPass  bool              `yaml:"continueOnPass" json:"continueOnPass" desc:"If true, continue checking after all assertions pass."`
+	MissingMetric   MissingBehavior   `yaml:"missingMetric" json:"missingMetric" desc:"Behavior when metric doesn't exist: wait, fail, pass."`
+	MissingSeries   MissingBehavior   `yaml:"missingSeries" json:"missingSeries" desc:"Behavior when no series matches labels: wait, fail, pass."`
+	ResetBehavior   ResetBehavior     `yaml:"resetBehavior" json:"resetBehavior" desc:"Behavior on counter reset in delta mode: fail, rebaseline, ignore."`
+	Assertions      []AssertionConfig `yaml:"assertions" json:"assertions" desc:"List of metric assertions to evaluate."`
+
+	// Parsed values (not from YAML)
+	maxResponseSizeBytes int64
+}
+
+func DefaultConfig() Config {
+	return Config{
+		PollInterval:    helper.Duration{Duration: 10 * time.Second},
+		RequestTimeout:  helper.Duration{Duration: 5 * time.Second},
+		MaxResponseSize: DefaultMaxResponseSize,
+		MissingMetric:   MissingBehaviorWait,
+		MissingSeries:   MissingBehaviorWait,
+		ResetBehavior:   ResetBehaviorFail,
+	}
+}
+
+func (c *Config) Validate() error {
+	if c.URL == "" {
+		return fmt.Errorf("url is required")
+	}
+
+	if len(c.Assertions) == 0 {
+		return fmt.Errorf("at least one assertion is required")
+	}
+
+	// Validate intervals to prevent tight-loops or disabled timeouts
+	if c.PollInterval.Duration <= 0 {
+		return fmt.Errorf("pollInterval must be positive")
+	}
+
+	if c.RequestTimeout.Duration <= 0 {
+		return fmt.Errorf("requestTimeout must be positive")
+	}
+
+	// Parse max response size
+	if c.MaxResponseSize != "" {
+		size, err := humanize.ParseBytes(c.MaxResponseSize)
+		if err != nil {
+			return fmt.Errorf("invalid maxResponseSize %q: %w", c.MaxResponseSize, err)
+		}
+
+		if size == 0 {
+			return fmt.Errorf("maxResponseSize must be positive")
+		}
+
+		if size > math.MaxInt64 {
+			return fmt.Errorf("maxResponseSize %q exceeds maximum allowed value", c.MaxResponseSize)
+		}
+
+		c.maxResponseSizeBytes = int64(size)
+	}
+
+	// Validate assertions and check for duplicate names
+	seenNames := make(map[string]bool, len(c.Assertions))
+
+	for i, a := range c.Assertions {
+		if a.Name == "" {
+			return fmt.Errorf("assertion[%d]: name is required", i)
+		}
+
+		if seenNames[a.Name] {
+			return fmt.Errorf("assertion[%d]: duplicate name %q", i, a.Name)
+		}
+
+		seenNames[a.Name] = true
+
+		if a.Metric == "" {
+			return fmt.Errorf("assertion[%d] %q: metric is required", i, a.Name)
+		}
+
+		if err := validateMode(a.Mode); err != nil {
+			return fmt.Errorf("assertion[%d] %q: %w", i, a.Name, err)
+		}
+
+		if err := validateOperator(a.Operator); err != nil {
+			return fmt.Errorf("assertion[%d] %q: %w", i, a.Name, err)
+		}
+
+		if a.MissingMetric != nil {
+			if err := validateMissingBehavior(*a.MissingMetric); err != nil {
+				return fmt.Errorf("assertion[%d] %q: missingMetric: %w", i, a.Name, err)
+			}
+		}
+
+		if a.MissingSeries != nil {
+			if err := validateMissingBehavior(*a.MissingSeries); err != nil {
+				return fmt.Errorf("assertion[%d] %q: missingSeries: %w", i, a.Name, err)
+			}
+		}
+	}
+
+	// Validate global enums
+	if err := validateMissingBehavior(c.MissingMetric); err != nil {
+		return fmt.Errorf("missingMetric: %w", err)
+	}
+
+	if err := validateMissingBehavior(c.MissingSeries); err != nil {
+		return fmt.Errorf("missingSeries: %w", err)
+	}
+
+	if err := validateResetBehavior(c.ResetBehavior); err != nil {
+		return fmt.Errorf("resetBehavior: %w", err)
+	}
+
+	return nil
+}
+
+func (c *Config) GetMaxResponseSizeBytes() int64 {
+	if c.maxResponseSizeBytes == 0 {
+		return 10 * 1024 * 1024 // 10MB default
+	}
+
+	return c.maxResponseSizeBytes
+}
+
+func validateMissingBehavior(b MissingBehavior) error {
+	switch b {
+	case MissingBehaviorWait, MissingBehaviorFail, MissingBehaviorPass, "":
+		return nil
+	default:
+		return fmt.Errorf("invalid value %q, must be one of: wait, fail, pass", b)
+	}
+}
+
+func validateResetBehavior(b ResetBehavior) error {
+	switch b {
+	case ResetBehaviorFail, ResetBehaviorRebaseline, ResetBehaviorIgnore, "":
+		return nil
+	default:
+		return fmt.Errorf("invalid value %q, must be one of: fail, rebaseline, ignore", b)
+	}
+}
+
+func validateMode(m AssertionMode) error {
+	switch m {
+	case AssertionModeValue, AssertionModeDelta, "":
+		return nil
+	default:
+		return fmt.Errorf("invalid mode %q, must be one of: value, delta", m)
+	}
+}
+
+func validateOperator(o Operator) error {
+	switch o {
+	case OperatorEq, OperatorNeq, OperatorGt, OperatorGte, OperatorLt, OperatorLte:
+		return nil
+	case "":
+		return fmt.Errorf("operator is required")
+	default:
+		return fmt.Errorf("invalid operator %q, must be one of: eq, neq, gt, gte, lt, lte", o)
+	}
+}
diff --git a/pkg/tasks/check_http_metrics/task.go b/pkg/tasks/check_http_metrics/task.go
new file mode 100644
index 00000000..8843579c
--- /dev/null
+++ b/pkg/tasks/check_http_metrics/task.go
@@ -0,0 +1,586 @@
+package checkhttpmetrics
+
+import (
+	"context"
+	"errors"
+	"fmt"
+	"io"
+	"math"
+	"net/http"
+	"strings"
+	"time"
+
+	"github.com/ethpandaops/assertoor/pkg/types"
+	"github.com/ethpandaops/assertoor/pkg/vars"
+	dto "github.com/prometheus/client_model/go"
+	"github.com/prometheus/common/expfmt"
+	"github.com/prometheus/common/model"
+	"github.com/sirupsen/logrus"
+)
+
+const outputTypeObject = "object"
+
+var (
+	TaskName       = "check_http_metrics"
+	TaskDescriptor = &types.TaskDescriptor{
+		Name:        TaskName,
+		Description: "Checks HTTP Prometheus metrics endpoint and evaluates assertions against metric values.",
+		Category:    "utility",
+		Config:      DefaultConfig(),
+		Outputs: []types.TaskOutputDefinition{
+			{
+				Name:        "passedAssertions",
+				Type:        "array",
+				Description: "Array of assertion names that passed.",
+			},
+			{
+				Name:        "failedAssertions",
+				Type:        "array",
+				Description: "Array of assertion names that failed.",
+			},
+			{
+				Name:        "values",
+				Type:        outputTypeObject,
+				Description: "Map of assertion name to latest observed value.",
+			},
+			{
+				Name:        "deltas",
+				Type:        outputTypeObject,
+				Description: "Map of assertion name to computed delta for delta-mode assertions.",
+			},
+			{
+				Name:        "baselines",
+				Type:        outputTypeObject,
+				Description: "Map of assertion name to baseline value for delta-mode assertions.",
+			},
+			{
+				Name:        "scrapeErrors",
+				Type:        "int",
+				Description: "Number of HTTP/parsing errors encountered.",
+			},
+			{
+				Name:        "assertionErrors",
+				Type:        "int",
+				Description: "Number of assertion evaluation errors.",
+			},
+		},
+		NewTask: NewTask,
+	}
+)
+
+type Task struct {
+	ctx        *types.TaskContext
+	options    *types.TaskOptions
+	config     Config
+	logger     logrus.FieldLogger
+	httpClient *http.Client
+
+	// State
+	baselines       map[string]float64
+	scrapeCount     int
+	scrapeErrors    int
+	assertionErrors int
+}
+
+func NewTask(ctx *types.TaskContext, options *types.TaskOptions) (types.Task, error) {
+	return &Task{
+		ctx:       ctx,
+		options:   options,
+		logger:    ctx.Logger.GetLogger(),
+		baselines: make(map[string]float64, 8),
+	}, nil
+}
+
+func (t *Task) Config() interface{} {
+	return t.config
+}
+
+func (t *Task) Timeout() time.Duration {
+	return t.options.Timeout.Duration
+}
+
+func (t *Task) LoadConfig() error {
+	config := DefaultConfig()
+
+	// parse static config
+	if t.options.Config != nil {
+		if err := t.options.Config.Unmarshal(&config); err != nil {
+			return fmt.Errorf("error parsing task config for %v: %w", TaskName, err)
+		}
+	}
+
+	// load dynamic vars
+	if err := t.ctx.Vars.ConsumeVars(&config, t.options.ConfigVars); err != nil {
+		return err
+	}
+
+	// validate config
+	if err := config.Validate(); err != nil {
+		return err
+	}
+
+	t.config = config
+
+	t.httpClient = &http.Client{
+		Timeout: config.RequestTimeout.Duration,
+	}
+
+	return nil
+}
+
+func (t *Task) Execute(ctx context.Context) error {
+	for {
+		t.scrapeCount++
+
+		done, err := t.runCheck(ctx)
+		if done {
+			return err
+		}
+
+		select {
+		case <-time.After(t.config.PollInterval.Duration):
+		case <-ctx.Done():
+			return ctx.Err()
+		}
+	}
+}
+
+type assertionResult struct {
+	name    string
+	passed  bool
+	value   float64
+	delta   float64
+	err     error
+	waiting bool // true if we should keep waiting (missing metric/series with wait behavior)
+}
+
+func (t *Task) runCheck(ctx context.Context) (bool, error) {
+	// Scrape metrics
+	metricFamilies, err := t.scrapeMetrics(ctx)
+	if err != nil {
+		t.scrapeErrors++
+		t.logger.Warnf("Scrape error (attempt %d): %v", t.scrapeCount, err)
+
+		if t.config.FailOnCheckMiss {
+			t.ctx.SetResult(types.TaskResultFailure)
+			t.setOutputs(nil)
+
+			return true, fmt.Errorf("scrape failed: %w", err)
+		}
+
+		t.ctx.SetResult(types.TaskResultNone)
+		t.ctx.ReportProgress(0, fmt.Sprintf("Scrape failed, retrying... (attempt %d)", t.scrapeCount))
+		t.setOutputs(nil) // Update outputs so scrapeErrors is visible
+
+		return false, nil
+	}
+
+	// Evaluate assertions
+	results := t.evaluateAssertions(metricFamilies)
+
+	// Collect results
+	var passedAssertions, failedAssertions []string
+
+	var anyWaiting, anyFailed bool
+
+	values := make(map[string]float64, len(results))
+	deltas := make(map[string]float64, len(results))
+
+	for _, r := range results {
+		if !math.IsNaN(r.value) {
+			values[r.name] = r.value
+		}
+
+		if !math.IsNaN(r.delta) {
+			deltas[r.name] = r.delta
+		}
+
+		if r.waiting {
+			anyWaiting = true
+
+			continue
+		}
+
+		if r.err != nil {
+			t.assertionErrors++
+
+			failedAssertions = append(failedAssertions, r.name)
+			anyFailed = true
+
+			t.logger.Warnf("Assertion %q error: %v", r.name, r.err)
+
+			continue
+		}
+
+		if r.passed {
+			passedAssertions = append(passedAssertions, r.name)
+		} else {
+			failedAssertions = append(failedAssertions, r.name)
+			anyFailed = true
+		}
+	}
+
+	t.setOutputs(&checkOutputs{
+		passedAssertions: passedAssertions,
+		failedAssertions: failedAssertions,
+		values:           values,
+		deltas:           deltas,
+	})
+
+	// Determine result
+	allPassed := !anyFailed && !anyWaiting
+
+	switch {
+	case allPassed:
+		t.ctx.SetResult(types.TaskResultSuccess)
+		t.ctx.ReportProgress(100, fmt.Sprintf("All assertions passed (%d/%d)", len(passedAssertions), len(t.config.Assertions)))
+
+		if !t.config.ContinueOnPass {
+			return true, nil
+		}
+
+	case anyFailed && t.config.FailOnCheckMiss:
+		t.ctx.SetResult(types.TaskResultFailure)
+
+		return true, fmt.Errorf("assertions failed: %v", failedAssertions)
+
+	default:
+		t.ctx.SetResult(types.TaskResultNone)
+		t.ctx.ReportProgress(0, fmt.Sprintf("Waiting... passed=%d failed=%d waiting=%d (attempt %d)",
+			len(passedAssertions), len(failedAssertions), countWaiting(results), t.scrapeCount))
+	}
+
+	return false, nil
+}
+
+type checkOutputs struct {
+	passedAssertions []string
+	failedAssertions []string
+	values           map[string]float64
+	deltas           map[string]float64
+}
+
+func (t *Task) setOutputs(out *checkOutputs) {
+	if out == nil {
+		t.ctx.Outputs.SetVar("passedAssertions", []string{})
+		t.ctx.Outputs.SetVar("failedAssertions", []string{})
+		t.ctx.Outputs.SetVar("values", map[string]float64{})
+		t.ctx.Outputs.SetVar("deltas", map[string]float64{})
+	} else {
+		if data, err := vars.GeneralizeData(out.passedAssertions); err == nil {
+			t.ctx.Outputs.SetVar("passedAssertions", data)
+		}
+
+		if data, err := vars.GeneralizeData(out.failedAssertions); err == nil {
+			t.ctx.Outputs.SetVar("failedAssertions", data)
+		}
+
+		if data, err := vars.GeneralizeData(out.values); err == nil {
+			t.ctx.Outputs.SetVar("values", data)
+		}
+
+		if data, err := vars.GeneralizeData(out.deltas); err == nil {
+			t.ctx.Outputs.SetVar("deltas", data)
+		}
+	}
+
+	// Baselines
+	if data, err := vars.GeneralizeData(t.baselines); err == nil {
+		t.ctx.Outputs.SetVar("baselines", data)
+	}
+
+	t.ctx.Outputs.SetVar("scrapeErrors", t.scrapeErrors)
+	t.ctx.Outputs.SetVar("assertionErrors", t.assertionErrors)
+}
+
+func countWaiting(results []assertionResult) int {
+	count := 0
+
+	for _, r := range results {
+		if r.waiting {
+			count++
+		}
+	}
+
+	return count
+}
+
+func (t *Task) scrapeMetrics(ctx context.Context) (map[string]*dto.MetricFamily, error) {
+	req, err := http.NewRequestWithContext(ctx, http.MethodGet, t.config.URL, http.NoBody)
+	if err != nil {
+		return nil, fmt.Errorf("failed to create request: %w", err)
+	}
+
+	for k, v := range t.config.Headers {
+		req.Header.Set(k, v)
+	}
+
+	resp, err := t.httpClient.Do(req)
+	if err != nil {
+		return nil, fmt.Errorf("HTTP request failed: %w", err)
+	}
+	defer resp.Body.Close()
+
+	if resp.StatusCode != http.StatusOK {
+		return nil, fmt.Errorf("unexpected status code: %d", resp.StatusCode)
+	}
+
+	// Limit response size
+	maxSize := t.config.GetMaxResponseSizeBytes()
+	limitedReader := io.LimitReader(resp.Body, maxSize+1)
+
+	body, err := io.ReadAll(limitedReader)
+	if err != nil {
+		return nil, fmt.Errorf("failed to read response body: %w", err)
+	}
+
+	if int64(len(body)) > maxSize {
+		return nil, fmt.Errorf("response body exceeds max size of %d bytes", maxSize)
+	}
+
+	// Parse Prometheus text format using UTF8 validation scheme
+	parser := expfmt.NewTextParser(model.UTF8Validation)
+
+	metricFamilies, err := parser.TextToMetricFamilies(strings.NewReader(string(body)))
+	if err != nil {
+		return nil, fmt.Errorf("failed to parse metrics: %w", err)
+	}
+
+	return metricFamilies, nil
+}
+
+func (t *Task) evaluateAssertions(metricFamilies map[string]*dto.MetricFamily) []assertionResult {
+	results := make([]assertionResult, 0, len(t.config.Assertions))
+
+	for i := range t.config.Assertions {
+		result := t.evaluateAssertion(&t.config.Assertions[i], metricFamilies)
+		results = append(results, result)
+	}
+
+	return results
+}
+
+func (t *Task) evaluateAssertion(a *AssertionConfig, metricFamilies map[string]*dto.MetricFamily) assertionResult {
+	result := assertionResult{
+		name:  a.Name,
+		value: math.NaN(),
+		delta: math.NaN(),
+	}
+
+	// Get effective missing behaviors
+	missingMetricBehavior := t.config.MissingMetric
+	if a.MissingMetric != nil {
+		missingMetricBehavior = *a.MissingMetric
+	}
+
+	missingSeriesBehavior := t.config.MissingSeries
+	if a.MissingSeries != nil {
+		missingSeriesBehavior = *a.MissingSeries
+	}
+
+	// Find the metric family
+	mf, ok := metricFamilies[a.Metric]
+	if !ok {
+		return t.handleMissing(result, missingMetricBehavior, fmt.Sprintf("metric %q not found", a.Metric))
+	}
+
+	// Find matching series
+	value, err := t.findMetricValue(mf, a.Labels)
+	if err != nil {
+		if strings.Contains(err.Error(), "no matching series") {
+			return t.handleMissing(result, missingSeriesBehavior, err.Error())
+		}
+
+		result.err = err
+
+		return result
+	}
+
+	result.value = value
+
+	// Check for non-finite values
+	if math.IsNaN(value) || math.IsInf(value, 0) {
+		result.err = fmt.Errorf("metric value is non-finite: %v", value)
+
+		return result
+	}
+
+	// Handle delta mode
+	mode := a.Mode
+	if mode == "" {
+		mode = AssertionModeValue
+	}
+
+	var compareValue float64
+
+	if mode == AssertionModeDelta {
+		baseline, hasBaseline := t.baselines[a.Name]
+
+		if !hasBaseline {
+			// First scrape: record baseline, don't evaluate
+			t.baselines[a.Name] = value
+			result.waiting = true
+
+			t.logger.Debugf("Assertion %q: recorded baseline %.4f", a.Name, value)
+
+			return result
+		}
+
+		// Check for counter reset (only applies to COUNTER type, not gauges)
+		// Gauges can legitimately decrease, so negative delta is normal for them
+		isCounter := mf.GetType() == dto.MetricType_COUNTER
+		if isCounter && value < baseline {
+			switch t.config.ResetBehavior {
+			case ResetBehaviorFail:
+				result.err = fmt.Errorf("counter reset detected: current %.4f < baseline %.4f", value, baseline)
+
+				return result
+			case ResetBehaviorRebaseline:
+				t.baselines[a.Name] = value
+				t.logger.Warnf("Assertion %q: counter reset detected, rebaselining to %.4f", a.Name, value)
+
+				result.waiting = true
+
+				return result
+			case ResetBehaviorIgnore:
+				// Use old baseline, may produce negative delta
+				t.logger.Warnf("Assertion %q: counter reset detected, ignoring", a.Name)
+			}
+		}
+
+		compareValue = value - baseline
+		result.delta = compareValue
+	} else {
+		compareValue = value
+	}
+
+	// Evaluate operator
+	result.passed = evaluateOperator(a.Operator, compareValue, a.Value)
+
+	if !result.passed {
+		t.logger.Debugf("Assertion %q failed: %.4f %s %.4f = false", a.Name, compareValue, a.Operator, a.Value)
+	}
+
+	return result
+}
+
+func (t *Task) handleMissing(result assertionResult, behavior MissingBehavior, message string) assertionResult {
+	switch behavior {
+	case MissingBehaviorFail:
+		result.err = errors.New(message)
+	case MissingBehaviorPass:
+		result.passed = true
+	case MissingBehaviorWait:
+		result.waiting = true
+	default:
+		result.waiting = true
+	}
+
+	return result
+}
+
+func (t *Task) findMetricValue(mf *dto.MetricFamily, labels map[string]string) (float64, error) {
+	var matchingMetrics []*dto.Metric
+
+	for _, m := range mf.GetMetric() {
+		if matchLabels(m.GetLabel(), labels) {
+			matchingMetrics = append(matchingMetrics, m)
+		}
+	}
+
+	if len(matchingMetrics) == 0 {
+		return 0, fmt.Errorf("no matching series for labels %v", labels)
+	}
+
+	if len(matchingMetrics) > 1 {
+		return 0, fmt.Errorf("labels match %d series (must match exactly one)", len(matchingMetrics))
+	}
+
+	value, err := getMetricValue(matchingMetrics[0], mf.GetType())
+	if err != nil {
+		return 0, fmt.Errorf("failed to extract metric value: %w", err)
+	}
+
+	return value, nil
+}
+
+func matchLabels(metricLabels []*dto.LabelPair, wantLabels map[string]string) bool {
+	if len(wantLabels) == 0 {
+		return true
+	}
+
+	labelMap := make(map[string]string, len(metricLabels))
+
+	for _, lp := range metricLabels {
+		labelMap[lp.GetName()] = lp.GetValue()
+	}
+
+	for k, v := range wantLabels {
+		if labelMap[k] != v {
+			return false
+		}
+	}
+
+	return true
+}
+
+var errNoMetricValue = errors.New("metric has no extractable value")
+
+func getMetricValue(m *dto.Metric, mType dto.MetricType) (float64, error) {
+	switch mType {
+	case dto.MetricType_COUNTER:
+		if c := m.GetCounter(); c != nil {
+			return c.GetValue(), nil
+		}
+	case dto.MetricType_GAUGE:
+		if g := m.GetGauge(); g != nil {
+			return g.GetValue(), nil
+		}
+	case dto.MetricType_UNTYPED:
+		if u := m.GetUntyped(); u != nil {
+			return u.GetValue(), nil
+		}
+	case dto.MetricType_SUMMARY:
+		if s := m.GetSummary(); s != nil {
+			return s.GetSampleSum(), nil
+		}
+	case dto.MetricType_HISTOGRAM, dto.MetricType_GAUGE_HISTOGRAM:
+		if h := m.GetHistogram(); h != nil {
+			return h.GetSampleSum(), nil
+		}
+	}
+
+	// Fallback: try all types
+	if c := m.GetCounter(); c != nil {
+		return c.GetValue(), nil
+	}
+
+	if g := m.GetGauge(); g != nil {
+		return g.GetValue(), nil
+	}
+
+	if u := m.GetUntyped(); u != nil {
+		return u.GetValue(), nil
+	}
+
+	return 0, errNoMetricValue
+}
+
+func evaluateOperator(op Operator, actual, expected float64) bool {
+	switch op {
+	case OperatorEq:
+		return actual == expected
+	case OperatorNeq:
+		return actual != expected
+	case OperatorGt:
+		return actual > expected
+	case OperatorGte:
+		return actual >= expected
+	case OperatorLt:
+		return actual < expected
+	case OperatorLte:
+		return actual <= expected
+	default:
+		return false
+	}
+}

From 2a07622efcd21e59a1843a759d24417728d91bd3 Mon Sep 17 00:00:00 2001
From: Chetany Bhardwaj <chetanyiot@gmail.com>
Date: Thu, 21 May 2026 23:54:18 +0530
Subject: [PATCH 2/8] test: add unit test for check_http_metrics

---
 go.mod                                    |    2 +-
 pkg/tasks/check_http_metrics/task_test.go | 1604 +++++++++++++++++++++
 pkg/tasks/tasks.go                        |    2 +
 3 files changed, 1607 insertions(+), 1 deletion(-)
 create mode 100644 pkg/tasks/check_http_metrics/task_test.go

diff --git a/go.mod b/go.mod
index fa157225..13da7bbd 100644
--- a/go.mod
+++ b/go.mod
@@ -41,6 +41,7 @@ require (
 	github.com/wealdtech/go-eth2-types/v2 v2.8.2
 	github.com/wealdtech/go-eth2-util v1.8.2
 	golang.org/x/text v0.37.0
+	google.golang.org/protobuf v1.36.11
 	gopkg.in/yaml.v2 v2.4.0
 	gopkg.in/yaml.v3 v3.0.1
 )
@@ -118,7 +119,6 @@ require (
 	golang.org/x/sys v0.43.0 // indirect
 	golang.org/x/time v0.15.0 // indirect
 	golang.org/x/tools v0.44.0 // indirect
-	google.golang.org/protobuf v1.36.11 // indirect
 	gopkg.in/cenkalti/backoff.v1 v1.1.0 // indirect
 	modernc.org/libc v1.72.1 // indirect
 	modernc.org/mathutil v1.7.1 // indirect
diff --git a/pkg/tasks/check_http_metrics/task_test.go b/pkg/tasks/check_http_metrics/task_test.go
new file mode 100644
index 00000000..60aa924e
--- /dev/null
+++ b/pkg/tasks/check_http_metrics/task_test.go
@@ -0,0 +1,1604 @@
+package checkhttpmetrics
+
+import (
+	"context"
+	"math"
+	"net/http"
+	"net/http/httptest"
+	"strings"
+	"testing"
+	"time"
+
+	"github.com/ethpandaops/assertoor/pkg/helper"
+	"github.com/ethpandaops/assertoor/pkg/types"
+	"github.com/ethpandaops/assertoor/pkg/vars"
+	dto "github.com/prometheus/client_model/go"
+	"github.com/sirupsen/logrus"
+	"google.golang.org/protobuf/proto"
+)
+
+const (
+	testMetricsURL         = "http://localhost:9090/metrics"
+	testMetric1            = "metric1"
+	testLabelFoo           = "foo"
+	testLabelBar           = "bar"
+	testLabelEnv           = "env"
+	testLabelRegion        = "region"
+	testValueProd          = "prod"
+	testAssertionName      = "test"
+	testAssertionName2     = "test_assertion"
+	testInvalidOpLabel     = "invalid operator"
+	testResetName          = "reset_test"
+	testCounterMetric      = "test_counter"
+	testCheckCounterAssert = "check_counter"
+)
+
+// validBaseConfig returns a config with required fields set for validation to pass intervals check.
+func validBaseConfig() Config {
+	return Config{
+		PollInterval:   helper.Duration{Duration: 10 * time.Second},
+		RequestTimeout: helper.Duration{Duration: 5 * time.Second},
+	}
+}
+
+func TestConfig_Validate(t *testing.T) {
+	tests := []struct {
+		name       string
+		configFunc func() Config
+		wantErr    string
+	}{
+		{
+			name:       "missing url",
+			configFunc: func() Config { return Config{} },
+			wantErr:    "url is required",
+		},
+		{
+			name: "missing assertions",
+			configFunc: func() Config {
+				c := validBaseConfig()
+				c.URL = testMetricsURL
+
+				return c
+			},
+			wantErr: "at least one assertion is required",
+		},
+		{
+			name: "missing assertion name",
+			configFunc: func() Config {
+				c := validBaseConfig()
+				c.URL = testMetricsURL
+				c.Assertions = []AssertionConfig{
+					{Metric: "test_metric", Operator: OperatorGt, Value: 0},
+				}
+
+				return c
+			},
+			wantErr: "assertion[0]: name is required",
+		},
+		{
+			name: "duplicate assertion names",
+			configFunc: func() Config {
+				c := validBaseConfig()
+				c.URL = testMetricsURL
+				c.Assertions = []AssertionConfig{
+					{Name: testAssertionName, Metric: testMetric1, Operator: OperatorGt, Value: 0},
+					{Name: testAssertionName, Metric: "metric2", Operator: OperatorGt, Value: 0},
+				}
+
+				return c
+			},
+			wantErr: "assertion[1]: duplicate name",
+		},
+		{
+			name: testInvalidOpLabel,
+			configFunc: func() Config {
+				c := validBaseConfig()
+				c.URL = testMetricsURL
+				c.Assertions = []AssertionConfig{
+					{Name: testAssertionName, Metric: testMetric1, Operator: "invalid", Value: 0},
+				}
+
+				return c
+			},
+			wantErr: testInvalidOpLabel,
+		},
+		{
+			name: "missing operator",
+			configFunc: func() Config {
+				c := validBaseConfig()
+				c.URL = testMetricsURL
+				c.Assertions = []AssertionConfig{
+					{Name: testAssertionName, Metric: testMetric1, Value: 0},
+				}
+
+				return c
+			},
+			wantErr: "operator is required",
+		},
+		{
+			name: "invalid max response size",
+			configFunc: func() Config {
+				c := validBaseConfig()
+				c.URL = testMetricsURL
+				c.MaxResponseSize = "invalid"
+				c.Assertions = []AssertionConfig{
+					{Name: testAssertionName, Metric: testMetric1, Operator: OperatorGt, Value: 0},
+				}
+
+				return c
+			},
+			wantErr: "invalid maxResponseSize",
+		},
+		{
+			name: "zero max response size",
+			configFunc: func() Config {
+				c := validBaseConfig()
+				c.URL = testMetricsURL
+				c.MaxResponseSize = "0B"
+				c.Assertions = []AssertionConfig{
+					{Name: testAssertionName, Metric: testMetric1, Operator: OperatorGt, Value: 0},
+				}
+
+				return c
+			},
+			wantErr: "maxResponseSize must be positive",
+		},
+		{
+			name: "valid config",
+			configFunc: func() Config {
+				c := validBaseConfig()
+				c.URL = testMetricsURL
+				c.MaxResponseSize = "10MB"
+				c.MissingMetric = MissingBehaviorWait
+				c.MissingSeries = MissingBehaviorFail
+				c.ResetBehavior = ResetBehaviorFail
+				c.Assertions = []AssertionConfig{
+					{Name: testAssertionName, Metric: testMetric1, Operator: OperatorGt, Value: 0},
+				}
+
+				return c
+			},
+			wantErr: "",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			cfg := tt.configFunc()
+			err := cfg.Validate()
+
+			switch {
+			case tt.wantErr == "" && err != nil:
+				t.Fatalf("unexpected error: %v", err)
+			case tt.wantErr != "" && err == nil:
+				t.Fatalf("expected error containing %q, got nil", tt.wantErr)
+			case tt.wantErr != "" && !strings.Contains(err.Error(), tt.wantErr):
+				t.Fatalf("error %q does not contain %q", err.Error(), tt.wantErr)
+			}
+		})
+	}
+}
+
+func TestMatchLabels(t *testing.T) {
+	tests := []struct {
+		name         string
+		metricLabels []*dto.LabelPair
+		wantLabels   map[string]string
+		want         bool
+	}{
+		{
+			name:         "empty want labels matches anything",
+			metricLabels: []*dto.LabelPair{{Name: proto.String(testLabelFoo), Value: proto.String(testLabelBar)}},
+			wantLabels:   nil,
+			want:         true,
+		},
+		{
+			name:         "exact match",
+			metricLabels: []*dto.LabelPair{{Name: proto.String(testLabelFoo), Value: proto.String(testLabelBar)}},
+			wantLabels:   map[string]string{testLabelFoo: testLabelBar},
+			want:         true,
+		},
+		{
+			name: "partial match (subset of labels)",
+			metricLabels: []*dto.LabelPair{
+				{Name: proto.String(testLabelFoo), Value: proto.String(testLabelBar)},
+				{Name: proto.String("baz"), Value: proto.String("qux")},
+			},
+			wantLabels: map[string]string{testLabelFoo: testLabelBar},
+			want:       true,
+		},
+		{
+			name:         "no match - different value",
+			metricLabels: []*dto.LabelPair{{Name: proto.String(testLabelFoo), Value: proto.String(testLabelBar)}},
+			wantLabels:   map[string]string{testLabelFoo: "baz"},
+			want:         false,
+		},
+		{
+			name:         "no match - missing label",
+			metricLabels: []*dto.LabelPair{{Name: proto.String(testLabelFoo), Value: proto.String(testLabelBar)}},
+			wantLabels:   map[string]string{"missing": "label"},
+			want:         false,
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			got := matchLabels(tt.metricLabels, tt.wantLabels)
+			if got != tt.want {
+				t.Errorf("matchLabels() = %v, want %v", got, tt.want)
+			}
+		})
+	}
+}
+
+func TestEvaluateOperator(t *testing.T) {
+	tests := []struct {
+		name     string
+		op       Operator
+		actual   float64
+		expected float64
+		want     bool
+	}{
+		{"eq true", OperatorEq, 5, 5, true},
+		{"eq false", OperatorEq, 5, 6, false},
+		{"neq true", OperatorNeq, 5, 6, true},
+		{"neq false", OperatorNeq, 5, 5, false},
+		{"gt true", OperatorGt, 6, 5, true},
+		{"gt false", OperatorGt, 5, 5, false},
+		{"gte true equal", OperatorGte, 5, 5, true},
+		{"gte true greater", OperatorGte, 6, 5, true},
+		{"gte false", OperatorGte, 4, 5, false},
+		{"lt true", OperatorLt, 4, 5, true},
+		{"lt false", OperatorLt, 5, 5, false},
+		{"lte true equal", OperatorLte, 5, 5, true},
+		{"lte true less", OperatorLte, 4, 5, true},
+		{"lte false", OperatorLte, 6, 5, false},
+		{testInvalidOpLabel, Operator("invalid"), 5, 5, false},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			got := evaluateOperator(tt.op, tt.actual, tt.expected)
+			if got != tt.want {
+				t.Errorf("evaluateOperator(%v, %v, %v) = %v, want %v", tt.op, tt.actual, tt.expected, got, tt.want)
+			}
+		})
+	}
+}
+
+func TestGetMetricValue(t *testing.T) {
+	counterVal := 42.0
+	gaugeVal := 3.14
+	untypedVal := 99.9
+	summarySum := 100.0
+	histogramSum := 200.0
+
+	tests := []struct {
+		name    string
+		metric  *dto.Metric
+		mType   dto.MetricType
+		want    float64
+		wantErr bool
+	}{
+		{
+			name:   "counter",
+			metric: &dto.Metric{Counter: &dto.Counter{Value: &counterVal}},
+			mType:  dto.MetricType_COUNTER,
+			want:   42.0,
+		},
+		{
+			name:   "gauge",
+			metric: &dto.Metric{Gauge: &dto.Gauge{Value: &gaugeVal}},
+			mType:  dto.MetricType_GAUGE,
+			want:   3.14,
+		},
+		{
+			name:   "untyped",
+			metric: &dto.Metric{Untyped: &dto.Untyped{Value: &untypedVal}},
+			mType:  dto.MetricType_UNTYPED,
+			want:   99.9,
+		},
+		{
+			name:   "summary returns sample sum",
+			metric: &dto.Metric{Summary: &dto.Summary{SampleSum: &summarySum}},
+			mType:  dto.MetricType_SUMMARY,
+			want:   100.0,
+		},
+		{
+			name:   "histogram returns sample sum",
+			metric: &dto.Metric{Histogram: &dto.Histogram{SampleSum: &histogramSum}},
+			mType:  dto.MetricType_HISTOGRAM,
+			want:   200.0,
+		},
+		{
+			name:   "fallback to counter when type unknown",
+			metric: &dto.Metric{Counter: &dto.Counter{Value: &counterVal}},
+			mType:  dto.MetricType(-1),
+			want:   42.0,
+		},
+		{
+			name:    "empty metric returns error",
+			metric:  &dto.Metric{},
+			mType:   dto.MetricType_COUNTER,
+			wantErr: true,
+		},
+		{
+			name:    "type mismatch with no fallback returns error",
+			metric:  &dto.Metric{},
+			mType:   dto.MetricType_GAUGE,
+			wantErr: true,
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			got, err := getMetricValue(tt.metric, tt.mType)
+
+			if tt.wantErr {
+				if err == nil {
+					t.Fatalf("expected error, got nil")
+				}
+
+				return
+			}
+
+			if err != nil {
+				t.Fatalf("unexpected error: %v", err)
+			}
+
+			if got != tt.want {
+				t.Errorf("getMetricValue() = %v, want %v", got, tt.want)
+			}
+		})
+	}
+}
+
+func TestDefaultConfig(t *testing.T) {
+	cfg := DefaultConfig()
+
+	if cfg.MissingMetric != MissingBehaviorWait {
+		t.Errorf("MissingMetric = %v, want %v", cfg.MissingMetric, MissingBehaviorWait)
+	}
+
+	if cfg.MissingSeries != MissingBehaviorWait {
+		t.Errorf("MissingSeries = %v, want %v", cfg.MissingSeries, MissingBehaviorWait)
+	}
+
+	if cfg.ResetBehavior != ResetBehaviorFail {
+		t.Errorf("ResetBehavior = %v, want %v", cfg.ResetBehavior, ResetBehaviorFail)
+	}
+
+	if cfg.MaxResponseSize != "10MB" {
+		t.Errorf("MaxResponseSize = %v, want 10MB", cfg.MaxResponseSize)
+	}
+}
+
+func TestGetMaxResponseSizeBytes(t *testing.T) {
+	tests := []struct {
+		name string
+		cfg  Config
+		want int64
+	}{
+		{
+			name: "default when not set",
+			cfg:  Config{},
+			want: 10 * 1024 * 1024,
+		},
+		{
+			name: "parsed value",
+			cfg:  Config{MaxResponseSize: "5MB", maxResponseSizeBytes: 5 * 1024 * 1024},
+			want: 5 * 1024 * 1024,
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			got := tt.cfg.GetMaxResponseSizeBytes()
+			if got != tt.want {
+				t.Errorf("GetMaxResponseSizeBytes() = %v, want %v", got, tt.want)
+			}
+		})
+	}
+}
+
+func TestValidateMissingBehavior(t *testing.T) {
+	validCases := []MissingBehavior{MissingBehaviorWait, MissingBehaviorFail, MissingBehaviorPass, ""}
+	for _, v := range validCases {
+		if err := validateMissingBehavior(v); err != nil {
+			t.Errorf("validateMissingBehavior(%q) returned unexpected error: %v", v, err)
+		}
+	}
+
+	if err := validateMissingBehavior("invalid"); err == nil {
+		t.Error("validateMissingBehavior(\"invalid\") expected error, got nil")
+	}
+}
+
+func TestValidateResetBehavior(t *testing.T) {
+	validCases := []ResetBehavior{ResetBehaviorFail, ResetBehaviorRebaseline, ResetBehaviorIgnore, ""}
+	for _, v := range validCases {
+		if err := validateResetBehavior(v); err != nil {
+			t.Errorf("validateResetBehavior(%q) returned unexpected error: %v", v, err)
+		}
+	}
+
+	if err := validateResetBehavior("invalid"); err == nil {
+		t.Error("validateResetBehavior(\"invalid\") expected error, got nil")
+	}
+}
+
+func TestValidateMode(t *testing.T) {
+	validCases := []AssertionMode{AssertionModeValue, AssertionModeDelta, ""}
+	for _, v := range validCases {
+		if err := validateMode(v); err != nil {
+			t.Errorf("validateMode(%q) returned unexpected error: %v", v, err)
+		}
+	}
+
+	if err := validateMode("invalid"); err == nil {
+		t.Error("validateMode(\"invalid\") expected error, got nil")
+	}
+}
+
+func TestValidateOperator(t *testing.T) {
+	validCases := []Operator{OperatorEq, OperatorNeq, OperatorGt, OperatorGte, OperatorLt, OperatorLte}
+	for _, v := range validCases {
+		if err := validateOperator(v); err != nil {
+			t.Errorf("validateOperator(%q) returned unexpected error: %v", v, err)
+		}
+	}
+
+	if err := validateOperator(""); err == nil {
+		t.Error("validateOperator(\"\") expected error, got nil")
+	}
+
+	if err := validateOperator("invalid"); err == nil {
+		t.Error("validateOperator(\"invalid\") expected error, got nil")
+	}
+}
+
+// newTestTask creates a Task for testing with a no-op logger.
+func newTestTask(cfg *Config) *Task {
+	logger := logrus.New()
+	logger.SetLevel(logrus.PanicLevel)
+
+	c := Config{}
+	if cfg != nil {
+		c = *cfg
+	}
+
+	return &Task{
+		config:    c,
+		logger:    logger,
+		baselines: make(map[string]float64),
+	}
+}
+
+// makeCounterFamily creates a COUNTER metric family with the given metrics.
+func makeCounterFamily(_ string, metrics ...*dto.Metric) *dto.MetricFamily {
+	mType := dto.MetricType_COUNTER
+
+	return &dto.MetricFamily{
+		Name:   proto.String(testMetric1),
+		Type:   &mType,
+		Metric: metrics,
+	}
+}
+
+// makeGaugeFamily creates a GAUGE metric family with the given metrics.
+func makeGaugeFamily(name string, metrics ...*dto.Metric) *dto.MetricFamily {
+	mType := dto.MetricType_GAUGE
+
+	return &dto.MetricFamily{
+		Name:   proto.String(name),
+		Type:   &mType,
+		Metric: metrics,
+	}
+}
+
+// makeCounter creates a counter metric with labels and value.
+func makeCounter(value float64, labels map[string]string) *dto.Metric {
+	m := &dto.Metric{
+		Counter: &dto.Counter{Value: proto.Float64(value)},
+	}
+
+	for k, v := range labels {
+		m.Label = append(m.Label, &dto.LabelPair{
+			Name:  proto.String(k),
+			Value: proto.String(v),
+		})
+	}
+
+	return m
+}
+
+// makeGauge creates a gauge metric with labels and value.
+func makeGauge(value float64, labels map[string]string) *dto.Metric {
+	m := &dto.Metric{
+		Gauge: &dto.Gauge{Value: proto.Float64(value)},
+	}
+
+	for k, v := range labels {
+		m.Label = append(m.Label, &dto.LabelPair{
+			Name:  proto.String(k),
+			Value: proto.String(v),
+		})
+	}
+
+	return m
+}
+
+// makeUntypedFamily creates an UNTYPED metric family with the given metrics.
+func makeUntypedFamily(name string, metrics ...*dto.Metric) *dto.MetricFamily {
+	mType := dto.MetricType_UNTYPED
+
+	return &dto.MetricFamily{
+		Name:   proto.String(name),
+		Type:   &mType,
+		Metric: metrics,
+	}
+}
+
+// makeUntyped creates an untyped metric with labels and value.
+func makeUntyped(value float64, labels map[string]string) *dto.Metric {
+	m := &dto.Metric{
+		Untyped: &dto.Untyped{Value: proto.Float64(value)},
+	}
+
+	for k, v := range labels {
+		m.Label = append(m.Label, &dto.LabelPair{
+			Name:  proto.String(k),
+			Value: proto.String(v),
+		})
+	}
+
+	return m
+}
+
+func TestFindMetricValue(t *testing.T) {
+	tests := []struct {
+		name      string
+		mf        *dto.MetricFamily
+		labels    map[string]string
+		wantValue float64
+		wantErr   string
+	}{
+		{
+			name:      "single series no labels",
+			mf:        makeCounterFamily(testMetric1, makeCounter(42, nil)),
+			labels:    nil,
+			wantValue: 42,
+		},
+		{
+			name: "single series with matching labels",
+			mf: makeCounterFamily(testMetric1, makeCounter(100, map[string]string{
+				testLabelEnv: testValueProd,
+			})),
+			labels:    map[string]string{testLabelEnv: testValueProd},
+			wantValue: 100,
+		},
+		{
+			name:    "no matching series",
+			mf:      makeCounterFamily(testMetric1, makeCounter(42, map[string]string{testLabelEnv: testValueProd})),
+			labels:  map[string]string{testLabelEnv: "dev"},
+			wantErr: "no matching series",
+		},
+		{
+			name: "multiple matching series error",
+			mf: makeCounterFamily(testMetric1,
+				makeCounter(10, map[string]string{testLabelEnv: testValueProd}),
+				makeCounter(20, map[string]string{testLabelEnv: testValueProd}),
+			),
+			labels:  map[string]string{testLabelEnv: testValueProd},
+			wantErr: "labels match 2 series",
+		},
+		{
+			name: "partial label match selects correct series",
+			mf: makeCounterFamily(testMetric1,
+				makeCounter(10, map[string]string{testLabelEnv: testValueProd, testLabelRegion: "us"}),
+				makeCounter(20, map[string]string{testLabelEnv: testValueProd, testLabelRegion: "eu"}),
+			),
+			labels:    map[string]string{testLabelEnv: testValueProd, testLabelRegion: "eu"},
+			wantValue: 20,
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			task := newTestTask(&Config{})
+			val, err := task.findMetricValue(tt.mf, tt.labels)
+
+			switch {
+			case tt.wantErr != "" && err == nil:
+				t.Fatalf("expected error containing %q, got nil", tt.wantErr)
+			case tt.wantErr != "" && !strings.Contains(err.Error(), tt.wantErr):
+				t.Fatalf("error %q does not contain %q", err.Error(), tt.wantErr)
+			case tt.wantErr == "" && err != nil:
+				t.Fatalf("unexpected error: %v", err)
+			case tt.wantErr == "" && val != tt.wantValue:
+				t.Errorf("findMetricValue() = %v, want %v", val, tt.wantValue)
+			}
+		})
+	}
+}
+
+func TestHandleMissing(t *testing.T) {
+	tests := []struct {
+		name     string
+		behavior MissingBehavior
+		wantErr  bool
+		wantPass bool
+		wantWait bool
+	}{
+		{"fail behavior", MissingBehaviorFail, true, false, false},
+		{"pass behavior", MissingBehaviorPass, false, true, false},
+		{"wait behavior", MissingBehaviorWait, false, false, true},
+		{"empty defaults to wait", "", false, false, true},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			task := newTestTask(&Config{})
+			result := assertionResult{name: "test"}
+			result = task.handleMissing(result, tt.behavior, "metric not found")
+
+			if tt.wantErr && result.err == nil {
+				t.Error("expected error, got nil")
+			}
+
+			if !tt.wantErr && result.err != nil {
+				t.Errorf("unexpected error: %v", result.err)
+			}
+
+			if result.passed != tt.wantPass {
+				t.Errorf("passed = %v, want %v", result.passed, tt.wantPass)
+			}
+
+			if result.waiting != tt.wantWait {
+				t.Errorf("waiting = %v, want %v", result.waiting, tt.wantWait)
+			}
+		})
+	}
+}
+
+func TestEvaluateAssertion_MissingMetric(t *testing.T) {
+	tests := []struct {
+		name     string
+		behavior MissingBehavior
+		wantErr  bool
+		wantPass bool
+		wantWait bool
+	}{
+		{"wait on missing metric", MissingBehaviorWait, false, false, true},
+		{"fail on missing metric", MissingBehaviorFail, true, false, false},
+		{"pass on missing metric", MissingBehaviorPass, false, true, false},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			task := newTestTask(&Config{MissingMetric: tt.behavior})
+			assertion := &AssertionConfig{
+				Name:     testAssertionName2,
+				Metric:   "nonexistent_metric",
+				Operator: OperatorGt,
+				Value:    0,
+			}
+
+			// Empty metric families - metric doesn't exist
+			result := task.evaluateAssertion(assertion, map[string]*dto.MetricFamily{})
+
+			if tt.wantErr {
+				if result.err == nil {
+					t.Fatal("expected error, got nil")
+				}
+
+				if !strings.Contains(result.err.Error(), "not found") {
+					t.Errorf("error %q does not contain 'not found'", result.err.Error())
+				}
+			} else if result.err != nil {
+				t.Fatalf("unexpected error: %v", result.err)
+			}
+
+			if result.passed != tt.wantPass {
+				t.Errorf("passed = %v, want %v", result.passed, tt.wantPass)
+			}
+
+			if result.waiting != tt.wantWait {
+				t.Errorf("waiting = %v, want %v", result.waiting, tt.wantWait)
+			}
+		})
+	}
+}
+
+func TestEvaluateAssertion_MissingSeries(t *testing.T) {
+	tests := []struct {
+		name     string
+		behavior MissingBehavior
+		wantErr  bool
+		wantPass bool
+		wantWait bool
+	}{
+		{"wait on missing series", MissingBehaviorWait, false, false, true},
+		{"fail on missing series", MissingBehaviorFail, true, false, false},
+		{"pass on missing series", MissingBehaviorPass, false, true, false},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			task := newTestTask(&Config{MissingSeries: tt.behavior})
+			assertion := &AssertionConfig{
+				Name:     testAssertionName2,
+				Metric:   testMetric1,
+				Labels:   map[string]string{testLabelEnv: "nonexistent"},
+				Operator: OperatorGt,
+				Value:    0,
+			}
+
+			// Metric exists but labels don't match
+			families := map[string]*dto.MetricFamily{
+				testMetric1: makeCounterFamily(testMetric1, makeCounter(42, map[string]string{testLabelEnv: testValueProd})),
+			}
+			result := task.evaluateAssertion(assertion, families)
+
+			if tt.wantErr {
+				if result.err == nil {
+					t.Fatal("expected error, got nil")
+				}
+
+				if !strings.Contains(result.err.Error(), "no matching series") {
+					t.Errorf("error %q does not contain 'no matching series'", result.err.Error())
+				}
+			} else if result.err != nil {
+				t.Fatalf("unexpected error: %v", result.err)
+			}
+
+			if result.passed != tt.wantPass {
+				t.Errorf("passed = %v, want %v", result.passed, tt.wantPass)
+			}
+
+			if result.waiting != tt.wantWait {
+				t.Errorf("waiting = %v, want %v", result.waiting, tt.wantWait)
+			}
+		})
+	}
+}
+
+func TestEvaluateAssertion_AssertionOverridesBehavior(t *testing.T) {
+	// Global behavior is wait, but assertion overrides to fail
+	failBehavior := MissingBehaviorFail
+	task := newTestTask(&Config{MissingMetric: MissingBehaviorWait})
+	assertion := &AssertionConfig{
+		Name:          "testAssertionName2",
+		Metric:        "nonexistent_metric",
+		Operator:      OperatorGt,
+		Value:         0,
+		MissingMetric: &failBehavior,
+	}
+
+	result := task.evaluateAssertion(assertion, map[string]*dto.MetricFamily{})
+
+	if result.err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if result.waiting {
+		t.Error("expected waiting=false when override is fail")
+	}
+}
+
+func TestEvaluateAssertion_ValueMode(t *testing.T) {
+	tests := []struct {
+		name       string
+		metricVal  float64
+		operator   Operator
+		assertVal  float64
+		wantPassed bool
+	}{
+		{"gt passes", 100, OperatorGt, 50, true},
+		{"gt fails", 50, OperatorGt, 100, false},
+		{"eq passes", 42, OperatorEq, 42, true},
+		{"eq fails", 42, OperatorEq, 43, false},
+		{"lte passes", 50, OperatorLte, 50, true},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			task := newTestTask(&Config{})
+			assertion := &AssertionConfig{
+				Name:     testAssertionName2,
+				Metric:   testMetric1,
+				Mode:     AssertionModeValue,
+				Operator: tt.operator,
+				Value:    tt.assertVal,
+			}
+
+			families := map[string]*dto.MetricFamily{
+				testMetric1: makeCounterFamily(testMetric1, makeCounter(tt.metricVal, nil)),
+			}
+			result := task.evaluateAssertion(assertion, families)
+
+			if result.err != nil {
+				t.Fatalf("unexpected error: %v", result.err)
+			}
+
+			if result.waiting {
+				t.Error("unexpected waiting=true")
+			}
+
+			if result.passed != tt.wantPassed {
+				t.Errorf("passed = %v, want %v", result.passed, tt.wantPassed)
+			}
+
+			if result.value != tt.metricVal {
+				t.Errorf("value = %v, want %v", result.value, tt.metricVal)
+			}
+
+			if !math.IsNaN(result.delta) {
+				t.Errorf("delta = %v, want NaN", result.delta)
+			}
+		})
+	}
+}
+
+func TestEvaluateAssertion_DeltaMode_FirstScrape(t *testing.T) {
+	task := newTestTask(&Config{})
+	assertion := &AssertionConfig{
+		Name:     "delta_test",
+		Metric:   testMetric1,
+		Mode:     AssertionModeDelta,
+		Operator: OperatorGt,
+		Value:    10,
+	}
+
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeCounterFamily(testMetric1, makeCounter(100, nil)),
+	}
+
+	// First scrape should record baseline and wait
+	result := task.evaluateAssertion(assertion, families)
+
+	if !result.waiting {
+		t.Error("first scrape should wait")
+	}
+
+	if result.passed {
+		t.Error("first scrape should not pass yet")
+	}
+
+	if result.err != nil {
+		t.Fatalf("unexpected error: %v", result.err)
+	}
+
+	if task.baselines["delta_test"] != 100.0 {
+		t.Errorf("baseline = %v, want 100.0", task.baselines["delta_test"])
+	}
+}
+
+func TestEvaluateAssertion_DeltaMode_SecondScrape(t *testing.T) {
+	task := newTestTask(&Config{})
+	task.baselines["delta_test"] = 100.0 // Simulate first scrape
+
+	assertion := &AssertionConfig{
+		Name:     "delta_test",
+		Metric:   testMetric1,
+		Mode:     AssertionModeDelta,
+		Operator: OperatorGt,
+		Value:    10,
+	}
+
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeCounterFamily(testMetric1, makeCounter(150, nil)),
+	}
+
+	// Second scrape should evaluate delta (150 - 100 = 50)
+	result := task.evaluateAssertion(assertion, families)
+
+	if result.waiting {
+		t.Error("second scrape should not wait")
+	}
+
+	if !result.passed {
+		t.Error("delta 50 > 10 should pass")
+	}
+
+	if result.err != nil {
+		t.Fatalf("unexpected error: %v", result.err)
+	}
+
+	if result.value != 150.0 {
+		t.Errorf("value = %v, want 150.0", result.value)
+	}
+
+	if result.delta != 50.0 {
+		t.Errorf("delta = %v, want 50.0", result.delta)
+	}
+}
+
+func TestEvaluateAssertion_CounterReset_Fail(t *testing.T) {
+	task := newTestTask(&Config{ResetBehavior: ResetBehaviorFail})
+	task.baselines[testResetName] = 100.0
+
+	assertion := &AssertionConfig{
+		Name:     testResetName,
+		Metric:   testMetric1,
+		Mode:     AssertionModeDelta,
+		Operator: OperatorGte,
+		Value:    0,
+	}
+
+	// Counter dropped from 100 to 50 (reset detected)
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeCounterFamily(testMetric1, makeCounter(50, nil)),
+	}
+
+	result := task.evaluateAssertion(assertion, families)
+
+	if result.err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if !strings.Contains(result.err.Error(), "counter reset detected") {
+		t.Errorf("error %q does not contain 'counter reset detected'", result.err.Error())
+	}
+}
+
+func TestEvaluateAssertion_CounterReset_Rebaseline(t *testing.T) {
+	task := newTestTask(&Config{ResetBehavior: ResetBehaviorRebaseline})
+	task.baselines[testResetName] = 100.0
+
+	assertion := &AssertionConfig{
+		Name:     testResetName,
+		Metric:   testMetric1,
+		Mode:     AssertionModeDelta,
+		Operator: OperatorGte,
+		Value:    0,
+	}
+
+	// Counter dropped from 100 to 50 (reset detected)
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeCounterFamily(testMetric1, makeCounter(50, nil)),
+	}
+
+	result := task.evaluateAssertion(assertion, families)
+
+	if result.err != nil {
+		t.Fatalf("unexpected error: %v", result.err)
+	}
+
+	if !result.waiting {
+		t.Error("should wait after rebaseline")
+	}
+
+	if task.baselines[testResetName] != 50.0 {
+		t.Errorf("baseline = %v, want 50.0", task.baselines[testResetName])
+	}
+}
+
+func TestEvaluateAssertion_CounterReset_Ignore(t *testing.T) {
+	task := newTestTask(&Config{ResetBehavior: ResetBehaviorIgnore})
+	task.baselines[testResetName] = 100.0
+
+	assertion := &AssertionConfig{
+		Name:     testResetName,
+		Metric:   testMetric1,
+		Mode:     AssertionModeDelta,
+		Operator: OperatorLt,
+		Value:    0,
+	}
+
+	// Counter dropped from 100 to 50 (reset detected but ignored)
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeCounterFamily(testMetric1, makeCounter(50, nil)),
+	}
+
+	result := task.evaluateAssertion(assertion, families)
+
+	if result.err != nil {
+		t.Fatalf("unexpected error: %v", result.err)
+	}
+
+	if result.waiting {
+		t.Error("should not wait when ignoring resets")
+	}
+
+	// Delta = 50 - 100 = -50, which is < 0
+	if !result.passed {
+		t.Error("negative delta should be allowed when ignoring resets")
+	}
+
+	if result.delta != -50.0 {
+		t.Errorf("delta = %v, want -50.0", result.delta)
+	}
+}
+
+func TestEvaluateAssertion_GaugeDecrease_NoReset(t *testing.T) {
+	// Gauges can decrease normally - this should NOT trigger reset detection
+	task := newTestTask(&Config{ResetBehavior: ResetBehaviorFail})
+	task.baselines["gauge_test"] = 100.0
+
+	assertion := &AssertionConfig{
+		Name:     "gauge_test",
+		Metric:   testMetric1,
+		Mode:     AssertionModeDelta,
+		Operator: OperatorLt,
+		Value:    0,
+	}
+
+	// Gauge dropped from 100 to 50 - this is normal for gauges
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeGaugeFamily(testMetric1, makeGauge(50, nil)),
+	}
+
+	result := task.evaluateAssertion(assertion, families)
+
+	// Should NOT error even though ResetBehavior is Fail - gauges don't reset
+	if result.err != nil {
+		t.Fatalf("unexpected error: %v", result.err)
+	}
+
+	if result.waiting {
+		t.Error("should not wait")
+	}
+
+	if !result.passed {
+		t.Error("gauge decrease should work normally")
+	}
+
+	if result.delta != -50.0 {
+		t.Errorf("delta = %v, want -50.0", result.delta)
+	}
+}
+
+func TestEvaluateAssertion_UntypedDecrease_NoReset(t *testing.T) {
+	// UNTYPED metrics (metrics without a TYPE declaration) should NOT trigger reset detection
+	task := newTestTask(&Config{ResetBehavior: ResetBehaviorFail})
+	task.baselines["untyped_test"] = 100.0
+
+	assertion := &AssertionConfig{
+		Name:     "untyped_test",
+		Metric:   testMetric1,
+		Mode:     AssertionModeDelta,
+		Operator: OperatorLt,
+		Value:    0,
+	}
+
+	// Untyped metric dropped from 100 to 50 - should NOT trigger reset detection
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeUntypedFamily(testMetric1, makeUntyped(50, nil)),
+	}
+
+	result := task.evaluateAssertion(assertion, families)
+
+	// Should NOT error even though ResetBehavior is Fail - only COUNTER type triggers reset
+	if result.err != nil {
+		t.Fatalf("unexpected error: %v", result.err)
+	}
+
+	if result.waiting {
+		t.Error("should not wait")
+	}
+
+	if !result.passed {
+		t.Error("untyped decrease should work normally without reset detection")
+	}
+
+	if result.delta != -50.0 {
+		t.Errorf("delta = %v, want -50.0", result.delta)
+	}
+}
+
+func TestEvaluateAssertion_NaN(t *testing.T) {
+	task := newTestTask(&Config{})
+	assertion := &AssertionConfig{
+		Name:     "nan_test",
+		Metric:   testMetric1,
+		Operator: OperatorGt,
+		Value:    0,
+	}
+
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeGaugeFamily(testMetric1, makeGauge(math.NaN(), nil)),
+	}
+
+	result := task.evaluateAssertion(assertion, families)
+
+	if result.err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if !strings.Contains(result.err.Error(), "non-finite") {
+		t.Errorf("error %q does not contain 'non-finite'", result.err.Error())
+	}
+}
+
+func TestEvaluateAssertion_Inf(t *testing.T) {
+	task := newTestTask(&Config{})
+	assertion := &AssertionConfig{
+		Name:     "inf_test",
+		Metric:   testMetric1,
+		Operator: OperatorGt,
+		Value:    0,
+	}
+
+	families := map[string]*dto.MetricFamily{
+		testMetric1: makeGaugeFamily(testMetric1, makeGauge(math.Inf(1), nil)),
+	}
+
+	result := task.evaluateAssertion(assertion, families)
+
+	if result.err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if !strings.Contains(result.err.Error(), "non-finite") {
+		t.Errorf("error %q does not contain 'non-finite'", result.err.Error())
+	}
+}
+
+func TestScrapeMetrics(t *testing.T) {
+	metricsBody := `# HELP test_counter A test counter
+# TYPE test_counter counter
+test_counter{env="prod"} 42
+test_counter{env="dev"} 10
+# HELP test_gauge A test gauge
+# TYPE test_gauge gauge
+test_gauge 3.14
+`
+
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.Header().Set("Content-Type", "text/plain")
+		w.WriteHeader(http.StatusOK)
+		_, _ = w.Write([]byte(metricsBody))
+	}))
+	defer server.Close()
+
+	task := newTestTask(&Config{
+		URL:            server.URL,
+		RequestTimeout: helper.Duration{Duration: 5 * time.Second},
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	families, err := task.scrapeMetrics(context.Background())
+	if err != nil {
+		t.Fatalf("unexpected error: %v", err)
+	}
+
+	if _, ok := families[testCounterMetric]; !ok {
+		t.Error("missing test_counter metric")
+	}
+
+	if _, ok := families["test_gauge"]; !ok {
+		t.Error("missing test_gauge metric")
+	}
+
+	// Verify counter values
+	counterFamily := families[testCounterMetric]
+	if counterFamily.GetType() != dto.MetricType_COUNTER {
+		t.Errorf("counter type = %v, want COUNTER", counterFamily.GetType())
+	}
+
+	if len(counterFamily.GetMetric()) != 2 {
+		t.Errorf("counter metric count = %d, want 2", len(counterFamily.GetMetric()))
+	}
+
+	// Verify gauge value
+	gaugeFamily := families["test_gauge"]
+	if gaugeFamily.GetType() != dto.MetricType_GAUGE {
+		t.Errorf("gauge type = %v, want GAUGE", gaugeFamily.GetType())
+	}
+
+	if len(gaugeFamily.GetMetric()) != 1 {
+		t.Errorf("gauge metric count = %d, want 1", len(gaugeFamily.GetMetric()))
+	}
+}
+
+func TestScrapeMetrics_HTTPError(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusInternalServerError)
+	}))
+	defer server.Close()
+
+	task := newTestTask(&Config{URL: server.URL})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	_, err := task.scrapeMetrics(context.Background())
+	if err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if !strings.Contains(err.Error(), "500") {
+		t.Errorf("error %q does not contain '500'", err.Error())
+	}
+}
+
+func TestScrapeMetrics_ResponseTooLarge(t *testing.T) {
+	// Create a response larger than the limit
+	largeBody := make([]byte, 100)
+	for i := range largeBody {
+		largeBody[i] = 'x'
+	}
+
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusOK)
+		_, _ = w.Write(largeBody)
+	}))
+	defer server.Close()
+
+	task := newTestTask(&Config{
+		URL:                  server.URL,
+		maxResponseSizeBytes: 50,
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	_, err := task.scrapeMetrics(context.Background())
+	if err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if !strings.Contains(err.Error(), "exceeds max size") {
+		t.Errorf("error %q does not contain 'exceeds max size'", err.Error())
+	}
+}
+
+func TestScrapeMetrics_InvalidPrometheusFormat(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusOK)
+		_, _ = w.Write([]byte("this is not prometheus format {{{"))
+	}))
+	defer server.Close()
+
+	task := newTestTask(&Config{URL: server.URL})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	_, err := task.scrapeMetrics(context.Background())
+	if err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if !strings.Contains(err.Error(), "parse") {
+		t.Errorf("error %q does not contain 'parse'", err.Error())
+	}
+}
+
+func TestScrapeMetrics_CustomHeaders(t *testing.T) {
+	var receivedAuth string
+
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+		receivedAuth = r.Header.Get("Authorization")
+
+		w.WriteHeader(http.StatusOK)
+		_, _ = w.Write([]byte("# HELP m A metric\n# TYPE m gauge\nm 1\n"))
+	}))
+	defer server.Close()
+
+	task := newTestTask(&Config{
+		URL:     server.URL,
+		Headers: map[string]string{"Authorization": "Bearer token123"},
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	_, err := task.scrapeMetrics(context.Background())
+	if err != nil {
+		t.Fatalf("unexpected error: %v", err)
+	}
+
+	if receivedAuth != "Bearer token123" {
+		t.Errorf("Authorization header = %q, want 'Bearer token123'", receivedAuth)
+	}
+}
+
+func newTestTaskWithContext(cfg *Config) (*Task, types.Variables, *types.TaskResult) {
+	logger := logrus.New()
+	logger.SetLevel(logrus.PanicLevel)
+
+	outputs := vars.NewVariables(nil)
+
+	var lastResult types.TaskResult
+
+	ctx := &types.TaskContext{
+		Outputs:        outputs,
+		SetResult:      func(r types.TaskResult) { lastResult = r },
+		ReportProgress: func(_ float64, _ string) {},
+	}
+
+	var config Config
+	if cfg != nil {
+		config = *cfg
+	}
+
+	task := &Task{
+		ctx:       ctx,
+		config:    config,
+		logger:    logger,
+		baselines: make(map[string]float64),
+	}
+
+	return task, outputs, &lastResult
+}
+
+func TestRunCheck_ScrapeError_FailOnCheckMiss(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusInternalServerError)
+	}))
+	defer server.Close()
+
+	task, outputs, result := newTestTaskWithContext(&Config{
+		URL:             server.URL,
+		FailOnCheckMiss: true,
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	done, err := task.runCheck(context.Background())
+
+	if !done {
+		t.Error("expected done=true")
+	}
+
+	if err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if !strings.Contains(err.Error(), "scrape failed") {
+		t.Errorf("error %q does not contain 'scrape failed'", err.Error())
+	}
+
+	if *result != types.TaskResultFailure {
+		t.Errorf("result = %v, want TaskResultFailure", *result)
+	}
+
+	if outputs.GetVar("scrapeErrors") != 1 {
+		t.Errorf("scrapeErrors = %v, want 1", outputs.GetVar("scrapeErrors"))
+	}
+}
+
+func TestRunCheck_ScrapeError_RetryOnFail(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusInternalServerError)
+	}))
+	defer server.Close()
+
+	task, outputs, result := newTestTaskWithContext(&Config{
+		URL:             server.URL,
+		FailOnCheckMiss: false,
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	done, err := task.runCheck(context.Background())
+
+	if done {
+		t.Error("expected done=false")
+	}
+
+	if err != nil {
+		t.Fatalf("unexpected error: %v", err)
+	}
+
+	if *result != types.TaskResultNone {
+		t.Errorf("result = %v, want TaskResultNone", *result)
+	}
+
+	if outputs.GetVar("scrapeErrors") != 1 {
+		t.Errorf("scrapeErrors = %v, want 1", outputs.GetVar("scrapeErrors"))
+	}
+}
+
+func TestRunCheck_AllAssertionsPass(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusOK)
+		_, _ = w.Write([]byte("# TYPE test_counter counter\ntest_counter 100\n"))
+	}))
+	defer server.Close()
+
+	task, outputs, result := newTestTaskWithContext(&Config{
+		URL:           server.URL,
+		MissingMetric: MissingBehaviorFail,
+		MissingSeries: MissingBehaviorFail,
+		Assertions: []AssertionConfig{
+			{Name: testCheckCounterAssert, Metric: testCounterMetric, Mode: AssertionModeValue, Operator: OperatorGte, Value: 50},
+		},
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	done, err := task.runCheck(context.Background())
+
+	if !done {
+		t.Error("expected done=true")
+	}
+
+	if err != nil {
+		t.Fatalf("unexpected error: %v", err)
+	}
+
+	if *result != types.TaskResultSuccess {
+		t.Errorf("result = %v, want TaskResultSuccess", *result)
+	}
+
+	passed, ok := outputs.GetVar("passedAssertions").([]interface{})
+	if !ok {
+		t.Fatalf("passedAssertions type = %T, want []interface{}", outputs.GetVar("passedAssertions"))
+	}
+
+	if len(passed) != 1 {
+		t.Errorf("passedAssertions length = %d, want 1", len(passed))
+	}
+
+	if len(passed) > 0 && passed[0] != testCheckCounterAssert {
+		t.Errorf("passedAssertions[0] = %v, want %q", passed[0], testCheckCounterAssert)
+	}
+}
+
+func TestRunCheck_AssertionFails(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusOK)
+		_, _ = w.Write([]byte("# TYPE test_counter counter\ntest_counter 10\n"))
+	}))
+	defer server.Close()
+
+	task, outputs, result := newTestTaskWithContext(&Config{
+		URL:             server.URL,
+		FailOnCheckMiss: true,
+		MissingMetric:   MissingBehaviorFail,
+		MissingSeries:   MissingBehaviorFail,
+		Assertions: []AssertionConfig{
+			{Name: testCheckCounterAssert, Metric: testCounterMetric, Mode: AssertionModeValue, Operator: OperatorGte, Value: 50},
+		},
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	done, err := task.runCheck(context.Background())
+
+	if !done {
+		t.Error("expected done=true")
+	}
+
+	if err == nil {
+		t.Fatal("expected error, got nil")
+	}
+
+	if *result != types.TaskResultFailure {
+		t.Errorf("result = %v, want TaskResultFailure", *result)
+	}
+
+	failed, ok := outputs.GetVar("failedAssertions").([]interface{})
+	if !ok {
+		t.Fatalf("failedAssertions type = %T, want []interface{}", outputs.GetVar("failedAssertions"))
+	}
+
+	if len(failed) != 1 {
+		t.Errorf("failedAssertions length = %d, want 1", len(failed))
+	}
+
+	if len(failed) > 0 && failed[0] != testCheckCounterAssert {
+		t.Errorf("failedAssertions[0] = %v, want %q", failed[0], testCheckCounterAssert)
+	}
+}
+
+func TestRunCheck_MixedAssertions(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusOK)
+		_, _ = w.Write([]byte("# TYPE metric_a counter\nmetric_a 100\n# TYPE metric_b counter\nmetric_b 5\n"))
+	}))
+	defer server.Close()
+
+	task, outputs, result := newTestTaskWithContext(&Config{
+		URL:             server.URL,
+		FailOnCheckMiss: false,
+		MissingMetric:   MissingBehaviorWait,
+		MissingSeries:   MissingBehaviorWait,
+		Assertions: []AssertionConfig{
+			{Name: "a_passes", Metric: "metric_a", Mode: AssertionModeValue, Operator: OperatorGte, Value: 50},
+			{Name: "b_fails", Metric: "metric_b", Mode: AssertionModeValue, Operator: OperatorGte, Value: 50},
+			{Name: "c_waits", Metric: "metric_missing", Mode: AssertionModeValue, Operator: OperatorGte, Value: 0},
+		},
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	done, err := task.runCheck(context.Background())
+
+	// Should keep waiting because one assertion is waiting
+	if done {
+		t.Error("expected done=false")
+	}
+
+	if err != nil {
+		t.Fatalf("unexpected error: %v", err)
+	}
+
+	if *result != types.TaskResultNone {
+		t.Errorf("result = %v, want TaskResultNone", *result)
+	}
+
+	passed, ok := outputs.GetVar("passedAssertions").([]interface{})
+	if !ok {
+		t.Fatalf("passedAssertions type = %T, want []interface{}", outputs.GetVar("passedAssertions"))
+	}
+
+	foundAPasses := false
+
+	for _, p := range passed {
+		if p == "a_passes" {
+			foundAPasses = true
+		}
+	}
+
+	if !foundAPasses {
+		t.Error("passedAssertions should contain 'a_passes'")
+	}
+
+	failed, ok := outputs.GetVar("failedAssertions").([]interface{})
+	if !ok {
+		t.Fatalf("failedAssertions type = %T, want []interface{}", outputs.GetVar("failedAssertions"))
+	}
+
+	foundBFails := false
+
+	for _, f := range failed {
+		if f == "b_fails" {
+			foundBFails = true
+		}
+	}
+
+	if !foundBFails {
+		t.Error("failedAssertions should contain 'b_fails'")
+	}
+}
+
+func TestRunCheck_AssertionErrorIncrement(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusOK)
+		// Metric with multiple matching series (causes assertion error)
+		_, _ = w.Write([]byte("# TYPE m counter\nm{env=\"a\"} 1\nm{env=\"b\"} 2\n"))
+	}))
+	defer server.Close()
+
+	task, outputs, _ := newTestTaskWithContext(&Config{
+		URL:             server.URL,
+		FailOnCheckMiss: false,
+		MissingMetric:   MissingBehaviorFail,
+		MissingSeries:   MissingBehaviorFail,
+		Assertions: []AssertionConfig{
+			{Name: "ambiguous", Metric: "m", Mode: AssertionModeValue, Operator: OperatorGte, Value: 0},
+		},
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	_, _ = task.runCheck(context.Background())
+
+	if outputs.GetVar("assertionErrors") != 1 {
+		t.Errorf("assertionErrors = %v, want 1", outputs.GetVar("assertionErrors"))
+	}
+}
+
+func TestRunCheck_ContinueOnPass(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		w.WriteHeader(http.StatusOK)
+		_, _ = w.Write([]byte("# TYPE my_counter counter\nmy_counter 100\n"))
+	}))
+	defer server.Close()
+
+	task, _, result := newTestTaskWithContext(&Config{
+		URL:            server.URL,
+		ContinueOnPass: true,
+		MissingMetric:  MissingBehaviorFail,
+		MissingSeries:  MissingBehaviorFail,
+		Assertions: []AssertionConfig{
+			{Name: "check", Metric: "my_counter", Mode: AssertionModeValue, Operator: OperatorGte, Value: 50},
+		},
+	})
+	task.httpClient = &http.Client{Timeout: 5 * time.Second}
+
+	done, err := task.runCheck(context.Background())
+
+	// Should continue even though all assertions pass
+	if done {
+		t.Error("expected done=false with continueOnPass")
+	}
+
+	if err != nil {
+		t.Fatalf("unexpected error: %v", err)
+	}
+
+	if *result != types.TaskResultSuccess {
+		t.Errorf("result = %v, want TaskResultSuccess", *result)
+	}
+}
diff --git a/pkg/tasks/tasks.go b/pkg/tasks/tasks.go
index 16d066de..ace4be72 100644
--- a/pkg/tasks/tasks.go
+++ b/pkg/tasks/tasks.go
@@ -19,6 +19,7 @@ import (
 	checkethcall "github.com/ethpandaops/assertoor/pkg/tasks/check_eth_call"
 	checkethconfig "github.com/ethpandaops/assertoor/pkg/tasks/check_eth_config"
 	checkexecutionsyncstatus "github.com/ethpandaops/assertoor/pkg/tasks/check_execution_sync_status"
+	checkhttpmetrics "github.com/ethpandaops/assertoor/pkg/tasks/check_http_metrics"
 	generateattestations "github.com/ethpandaops/assertoor/pkg/tasks/generate_attestations"
 	generatebatchdeposits "github.com/ethpandaops/assertoor/pkg/tasks/generate_batch_deposits"
 	generateblobtransactions "github.com/ethpandaops/assertoor/pkg/tasks/generate_blob_transactions"
@@ -71,6 +72,7 @@ var AvailableTaskDescriptors = []*types.TaskDescriptor{
 	checkexecutionblock.TaskDescriptor,
 	checkethcall.TaskDescriptor,
 	checkethconfig.TaskDescriptor,
+	checkhttpmetrics.TaskDescriptor,
 	checkexecutionsyncstatus.TaskDescriptor,
 	generateattestations.TaskDescriptor,
 	generatebatchdeposits.TaskDescriptor,

From e218f5d6090b1b23e13958c5e75340b9ae6d5803 Mon Sep 17 00:00:00 2001
From: Chetany Bhardwaj <chetanyiot@gmail.com>
Date: Thu, 21 May 2026 23:54:53 +0530
Subject: [PATCH 3/8] docs: add README for check_http_metrics

---
 pkg/tasks/check_http_metrics/README.md | 99 ++++++++++++++++++++++++++
 1 file changed, 99 insertions(+)
 create mode 100644 pkg/tasks/check_http_metrics/README.md

diff --git a/pkg/tasks/check_http_metrics/README.md b/pkg/tasks/check_http_metrics/README.md
new file mode 100644
index 00000000..637af8cd
--- /dev/null
+++ b/pkg/tasks/check_http_metrics/README.md
@@ -0,0 +1,99 @@
+## `check_http_metrics` Task
+
+### Description
+The `check_http_metrics` task fetches metrics from an HTTP Prometheus endpoint and evaluates assertions against metric values.
+
+#### Task Behavior
+- The task polls the metrics endpoint at regular intervals.
+- By default, the task returns immediately when all assertions pass.
+- Use `continueOnPass: true` to keep monitoring even after success.
+- Use `failOnCheckMiss: true` to fail immediately when assertions are not met.
+
+### Configuration Parameters
+
+- **`url`**:\
+  HTTP URL of the Prometheus metrics endpoint. Required.
+
+- **`headers`**:\
+  Optional HTTP request headers (e.g., for authentication). Default: `{}`.
+
+- **`pollInterval`**:\
+  Interval between metric scrapes. Default: `10s`.
+
+- **`requestTimeout`**:\
+  Timeout for a single HTTP request. Default: `5s`.
+
+- **`maxResponseSize`**:\
+  Maximum response body size. Must be positive. Default: `10MB`.
+
+- **`failOnCheckMiss`**:\
+  If `true`, fail immediately when assertions are not met. If `false`, keep polling until timeout or success. Default: `false`.
+
+- **`continueOnPass`**:\
+  If `true`, continue checking after all assertions pass. Default: `false`.
+
+- **`missingMetric`**:\
+  Behavior when a metric family is missing: `wait`, `fail`, or `pass`. Default: `wait`.
+
+- **`missingSeries`**:\
+  Behavior when no time series matches the label selector: `wait`, `fail`, or `pass`. Default: `wait`.
+
+- **`resetBehavior`**:\
+  Behavior when a COUNTER metric's value drops below baseline (indicating restart): `fail`, `rebaseline`, or `ignore`. Only applies to COUNTER type metrics. Default: `fail`.
+
+- **`assertions`**:\
+  List of metric assertions. At least one required. Example:
+  ```yaml
+  - { "name": "counter_increased", "metric": "my_counter", "labels": { "env": "prod" }, "mode": "delta", "operator": "gt", "value": 0 }
+  ```
+
+#### Assertion Configuration
+
+- **`name`**: Unique assertion name. Required.
+- **`metric`**: Prometheus metric name. Required.
+- **`labels`**: Label selector (subset matching). Must match exactly one series.
+- **`mode`**: `value` (current value) or `delta` (change since baseline). Default: `value`.
+- **`operator`**: Comparison operator: `eq`, `neq`, `gt`, `gte`, `lt`, `lte`. Required.
+- **`value`**: Expected numeric value. Required.
+- **`missingMetric`**: Per-assertion override for global `missingMetric`.
+- **`missingSeries`**: Per-assertion override for global `missingSeries`.
+
+#### Metric Type Handling
+
+| Type | Value Extracted |
+|------|-----------------|
+| COUNTER | Counter value |
+| GAUGE | Gauge value |
+| UNTYPED | Untyped value |
+| SUMMARY | Sample sum |
+| HISTOGRAM | Sample sum |
+
+Counter reset detection only applies to COUNTER type. SUMMARY and HISTOGRAM use sample sum; bucket/quantile helpers are not supported.
+
+### Outputs
+
+- **`passedAssertions`**: Array of assertion names that passed.
+- **`failedAssertions`**: Array of assertion names that failed.
+- **`values`**: Map of assertion name to latest observed value.
+- **`deltas`**: Map of assertion name to computed delta (for `delta` mode).
+- **`baselines`**: Map of assertion name to baseline value (for `delta` mode).
+- **`scrapeErrors`**: Number of HTTP/parsing errors.
+- **`assertionErrors`**: Number of assertion evaluation errors.
+
+### Defaults
+
+```yaml
+- name: check_http_metrics
+  config:
+    url: ""
+    headers: {}
+    pollInterval: 10s
+    requestTimeout: 5s
+    maxResponseSize: 10MB
+    failOnCheckMiss: false
+    continueOnPass: false
+    missingMetric: wait
+    missingSeries: wait
+    resetBehavior: fail
+    assertions: []
+```

From 2da20a6f5c8928de84724759bf279615860eff97 Mon Sep 17 00:00:00 2001
From: Chetany Bhardwaj <chetanyiot@gmail.com>
Date: Thu, 21 May 2026 23:56:37 +0530
Subject: [PATCH 4/8] docs: update check_http_metrics README with delta usage

---
 pkg/tasks/check_http_metrics/README.md | 40 +++++++++++++++++++++++---
 1 file changed, 36 insertions(+), 4 deletions(-)

diff --git a/pkg/tasks/check_http_metrics/README.md b/pkg/tasks/check_http_metrics/README.md
index 637af8cd..54526471 100644
--- a/pkg/tasks/check_http_metrics/README.md
+++ b/pkg/tasks/check_http_metrics/README.md
@@ -42,10 +42,7 @@ The `check_http_metrics` task fetches metrics from an HTTP Prometheus endpoint a
   Behavior when a COUNTER metric's value drops below baseline (indicating restart): `fail`, `rebaseline`, or `ignore`. Only applies to COUNTER type metrics. Default: `fail`.
 
 - **`assertions`**:\
-  List of metric assertions. At least one required. Example:
-  ```yaml
-  - { "name": "counter_increased", "metric": "my_counter", "labels": { "env": "prod" }, "mode": "delta", "operator": "gt", "value": 0 }
-  ```
+  List of metric assertions. At least one required.
 
 #### Assertion Configuration
 
@@ -58,6 +55,41 @@ The `check_http_metrics` task fetches metrics from an HTTP Prometheus endpoint a
 - **`missingMetric`**: Per-assertion override for global `missingMetric`.
 - **`missingSeries`**: Per-assertion override for global `missingSeries`.
 
+#### Delta Mode
+
+In `delta` mode, the task tracks changes over time:
+1. First scrape: records the current value as baseline (waits, does not evaluate)
+2. Subsequent scrapes: computes `delta = current - baseline` and evaluates
+
+Negative deltas are valid for GAUGE and UNTYPED metrics. For COUNTER metrics, a decrease triggers `resetBehavior`.
+
+#### Examples
+
+```yaml
+assertions:
+  # Check counter increased by at least 1
+  - name: counter_increased
+    metric: my_counter
+    labels:
+      env: prod
+    mode: delta
+    operator: gte
+    value: 1
+
+  # Check gauge decreased (negative delta)
+  - name: gauge_dropped
+    metric: my_gauge
+    mode: delta
+    operator: lte
+    value: -1
+
+  # Check current value is above threshold
+  - name: value_above_threshold
+    metric: my_metric
+    operator: gt
+    value: 100
+```
+
 #### Metric Type Handling
 
 | Type | Value Extracted |

From e5d50936dc3583f59ecc1375b8596a248ce77546 Mon Sep 17 00:00:00 2001
From: Chetany Bhardwaj <chetanyiot@gmail.com>
Date: Fri, 22 May 2026 00:05:07 +0530
Subject: [PATCH 5/8] refactor: fix styling, follow pandaops go practices

---
 pkg/tasks/check_http_metrics/config.go | 11 ++++++-----
 pkg/tasks/check_http_metrics/task.go   | 23 ++++++++++++++++++-----
 2 files changed, 24 insertions(+), 10 deletions(-)

diff --git a/pkg/tasks/check_http_metrics/config.go b/pkg/tasks/check_http_metrics/config.go
index 84c67a7c..e3d726ed 100644
--- a/pkg/tasks/check_http_metrics/config.go
+++ b/pkg/tasks/check_http_metrics/config.go
@@ -17,11 +17,11 @@ const (
 	MissingBehaviorWait MissingBehavior = "wait"
 	MissingBehaviorFail MissingBehavior = "fail"
 	MissingBehaviorPass MissingBehavior = "pass"
-
-	// DefaultMaxResponseSize is the default maximum response body size for metrics scraping.
-	DefaultMaxResponseSize = "10MB"
 )
 
+// DefaultMaxResponseSize is the default maximum response body size for metrics scraping.
+const DefaultMaxResponseSize = "10MB"
+
 // ResetBehavior controls what happens when a counter value drops below its baseline,
 // which typically indicates a service restart or counter reset.
 type ResetBehavior string
@@ -54,11 +54,12 @@ const (
 )
 
 // AssertionConfig defines a single metric assertion to evaluate.
-// Labels must match exactly one time series; matching zero or multiple series is an error.
+// Labels are a subset selector that must match exactly one time series;
+// matching zero or multiple series is an error.
 type AssertionConfig struct {
 	Name          string            `yaml:"name" json:"name" desc:"Unique human-readable assertion name."`
 	Metric        string            `yaml:"metric" json:"metric" desc:"Prometheus metric name."`
-	Labels        map[string]string `yaml:"labels" json:"labels" desc:"Exact label match for the time series."`
+	Labels        map[string]string `yaml:"labels" json:"labels" desc:"Label selector; all specified labels must match and select exactly one time series."`
 	Mode          AssertionMode     `yaml:"mode" json:"mode" desc:"Evaluation mode: 'value' (current value) or 'delta' (change since baseline)."`
 	Operator      Operator          `yaml:"operator" json:"operator" desc:"Comparison operator: eq, neq, gt, gte, lt, lte."`
 	Value         float64           `yaml:"value" json:"value" desc:"Expected value for comparison."`
diff --git a/pkg/tasks/check_http_metrics/task.go b/pkg/tasks/check_http_metrics/task.go
index 8843579c..2ddedbc8 100644
--- a/pkg/tasks/check_http_metrics/task.go
+++ b/pkg/tasks/check_http_metrics/task.go
@@ -20,6 +20,9 @@ import (
 
 const outputTypeObject = "object"
 
+// Compile-time interface compliance check.
+var _ types.Task = (*Task)(nil)
+
 var (
 	TaskName       = "check_http_metrics"
 	TaskDescriptor = &types.TaskDescriptor{
@@ -267,25 +270,35 @@ func (t *Task) setOutputs(out *checkOutputs) {
 		t.ctx.Outputs.SetVar("values", map[string]float64{})
 		t.ctx.Outputs.SetVar("deltas", map[string]float64{})
 	} else {
-		if data, err := vars.GeneralizeData(out.passedAssertions); err == nil {
+		if data, err := vars.GeneralizeData(out.passedAssertions); err != nil {
+			t.logger.Warnf("failed to generalize passedAssertions: %v", err)
+		} else {
 			t.ctx.Outputs.SetVar("passedAssertions", data)
 		}
 
-		if data, err := vars.GeneralizeData(out.failedAssertions); err == nil {
+		if data, err := vars.GeneralizeData(out.failedAssertions); err != nil {
+			t.logger.Warnf("failed to generalize failedAssertions: %v", err)
+		} else {
 			t.ctx.Outputs.SetVar("failedAssertions", data)
 		}
 
-		if data, err := vars.GeneralizeData(out.values); err == nil {
+		if data, err := vars.GeneralizeData(out.values); err != nil {
+			t.logger.Warnf("failed to generalize values: %v", err)
+		} else {
 			t.ctx.Outputs.SetVar("values", data)
 		}
 
-		if data, err := vars.GeneralizeData(out.deltas); err == nil {
+		if data, err := vars.GeneralizeData(out.deltas); err != nil {
+			t.logger.Warnf("failed to generalize deltas: %v", err)
+		} else {
 			t.ctx.Outputs.SetVar("deltas", data)
 		}
 	}
 
 	// Baselines
-	if data, err := vars.GeneralizeData(t.baselines); err == nil {
+	if data, err := vars.GeneralizeData(t.baselines); err != nil {
+		t.logger.Warnf("failed to generalize baselines: %v", err)
+	} else {
 		t.ctx.Outputs.SetVar("baselines", data)
 	}
 

From d50cf34c0361adfec2de1bd2317328893153d391 Mon Sep 17 00:00:00 2001
From: Chetany Bhardwaj <chetanyiot@gmail.com>
Date: Tue, 26 May 2026 11:22:42 +0200
Subject: [PATCH 6/8] refactor(check_http_metrics): set maxResponseSize default
 in Validate()

Move the default maxResponseSize handling from the getter fallback to
Validate(). This ensures a single source of truth for the default value
and guarantees maxResponseSizeBytes is always populated after validation.

- Validate() now sets DefaultMaxResponseSize if MaxResponseSize is empty
- Simplified GetMaxResponseSizeBytes() to just return the value
- Removed redundant fallback that duplicated the default

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 pkg/tasks/check_http_metrics/config.go | 32 ++++++++++++--------------
 1 file changed, 15 insertions(+), 17 deletions(-)

diff --git a/pkg/tasks/check_http_metrics/config.go b/pkg/tasks/check_http_metrics/config.go
index e3d726ed..8e7b73b3 100644
--- a/pkg/tasks/check_http_metrics/config.go
+++ b/pkg/tasks/check_http_metrics/config.go
@@ -115,24 +115,26 @@ func (c *Config) Validate() error {
 		return fmt.Errorf("requestTimeout must be positive")
 	}
 
-	// Parse max response size
-	if c.MaxResponseSize != "" {
-		size, err := humanize.ParseBytes(c.MaxResponseSize)
-		if err != nil {
-			return fmt.Errorf("invalid maxResponseSize %q: %w", c.MaxResponseSize, err)
-		}
+	// Set default and parse max response size
+	if c.MaxResponseSize == "" {
+		c.MaxResponseSize = DefaultMaxResponseSize
+	}
 
-		if size == 0 {
-			return fmt.Errorf("maxResponseSize must be positive")
-		}
+	size, err := humanize.ParseBytes(c.MaxResponseSize)
+	if err != nil {
+		return fmt.Errorf("invalid maxResponseSize %q: %w", c.MaxResponseSize, err)
+	}
 
-		if size > math.MaxInt64 {
-			return fmt.Errorf("maxResponseSize %q exceeds maximum allowed value", c.MaxResponseSize)
-		}
+	if size == 0 {
+		return fmt.Errorf("maxResponseSize must be positive")
+	}
 
-		c.maxResponseSizeBytes = int64(size)
+	if size > math.MaxInt64 {
+		return fmt.Errorf("maxResponseSize %q exceeds maximum allowed value", c.MaxResponseSize)
 	}
 
+	c.maxResponseSizeBytes = int64(size)
+
 	// Validate assertions and check for duplicate names
 	seenNames := make(map[string]bool, len(c.Assertions))
 
@@ -189,10 +191,6 @@ func (c *Config) Validate() error {
 }
 
 func (c *Config) GetMaxResponseSizeBytes() int64 {
-	if c.maxResponseSizeBytes == 0 {
-		return 10 * 1024 * 1024 // 10MB default
-	}
-
 	return c.maxResponseSizeBytes
 }
 

From 9c18219e764e876e92311ba91a44b8a6c55178c9 Mon Sep 17 00:00:00 2001
From: Chetany Bhardwaj <chetanyiot@gmail.com>
Date: Tue, 26 May 2026 11:23:01 +0200
Subject: [PATCH 7/8] test(check_http_metrics): add full-cycle integration
 tests

Add integration tests that mirror production usage by starting from
DefaultConfig(), calling Validate(), and executing the full task flow.
These tests verify the complete lifecycle and catch issues like missing
defaults that unit tests may miss.

New tests:
- TestIntegration_ValueMode: basic value assertion with label matching
- TestIntegration_DeltaMode: delta mode with baseline and evaluation
- TestIntegration_MultipleAssertions: multiple assertions on different metrics

Also updated test helpers to use decimal MB values (10,000,000) consistent
with humanize.ParseBytes("10MB") and fixed TestGetMaxResponseSizeBytes to
test the new Validate() behavior.

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 pkg/tasks/check_http_metrics/task_test.go | 375 ++++++++++++++++++++--
 1 file changed, 351 insertions(+), 24 deletions(-)

diff --git a/pkg/tasks/check_http_metrics/task_test.go b/pkg/tasks/check_http_metrics/task_test.go
index 60aa924e..d52e122f 100644
--- a/pkg/tasks/check_http_metrics/task_test.go
+++ b/pkg/tasks/check_http_metrics/task_test.go
@@ -2,6 +2,7 @@ package checkhttpmetrics
 
 import (
 	"context"
+	"fmt"
 	"math"
 	"net/http"
 	"net/http/httptest"
@@ -24,6 +25,7 @@ const (
 	testLabelBar           = "bar"
 	testLabelEnv           = "env"
 	testLabelRegion        = "region"
+	testLabelHost          = "host"
 	testValueProd          = "prod"
 	testAssertionName      = "test"
 	testAssertionName2     = "test_assertion"
@@ -374,31 +376,46 @@ func TestDefaultConfig(t *testing.T) {
 }
 
 func TestGetMaxResponseSizeBytes(t *testing.T) {
-	tests := []struct {
-		name string
-		cfg  Config
-		want int64
-	}{
-		{
-			name: "default when not set",
-			cfg:  Config{},
-			want: 10 * 1024 * 1024,
-		},
-		{
-			name: "parsed value",
-			cfg:  Config{MaxResponseSize: "5MB", maxResponseSizeBytes: 5 * 1024 * 1024},
-			want: 5 * 1024 * 1024,
-		},
-	}
+	// Test that Validate() sets the default when MaxResponseSize is empty
+	t.Run("default set by Validate when empty", func(t *testing.T) {
+		cfg := Config{
+			URL:            "http://example.com",
+			PollInterval:   helper.Duration{Duration: time.Second},
+			RequestTimeout: helper.Duration{Duration: time.Second},
+			Assertions:     []AssertionConfig{{Name: testAssertionName, Metric: "m", Operator: OperatorEq}},
+		}
+		if err := cfg.Validate(); err != nil {
+			t.Fatalf("Validate() failed: %v", err)
+		}
 
-	for _, tt := range tests {
-		t.Run(tt.name, func(t *testing.T) {
-			got := tt.cfg.GetMaxResponseSizeBytes()
-			if got != tt.want {
-				t.Errorf("GetMaxResponseSizeBytes() = %v, want %v", got, tt.want)
-			}
-		})
-	}
+		got := cfg.GetMaxResponseSizeBytes()
+		want := int64(10 * 1000 * 1000) // 10MB = 10,000,000 bytes (decimal)
+
+		if got != want {
+			t.Errorf("GetMaxResponseSizeBytes() = %v, want %v", got, want)
+		}
+	})
+
+	// Test that Validate() parses custom MaxResponseSize
+	t.Run("custom value parsed by Validate", func(t *testing.T) {
+		cfg := Config{
+			URL:             "http://example.com",
+			MaxResponseSize: "5MB",
+			PollInterval:    helper.Duration{Duration: time.Second},
+			RequestTimeout:  helper.Duration{Duration: time.Second},
+			Assertions:      []AssertionConfig{{Name: testAssertionName, Metric: "m", Operator: OperatorEq}},
+		}
+		if err := cfg.Validate(); err != nil {
+			t.Fatalf("Validate() failed: %v", err)
+		}
+
+		got := cfg.GetMaxResponseSizeBytes()
+		want := int64(5 * 1000 * 1000) // 5MB = 5,000,000 bytes (decimal)
+
+		if got != want {
+			t.Errorf("GetMaxResponseSizeBytes() = %v, want %v", got, want)
+		}
+	})
 }
 
 func TestValidateMissingBehavior(t *testing.T) {
@@ -467,6 +484,12 @@ func newTestTask(cfg *Config) *Task {
 		c = *cfg
 	}
 
+	// Ensure maxResponseSizeBytes has a default for tests that don't call Validate
+	// Use decimal value (10MB = 10,000,000) consistent with humanize.ParseBytes
+	if c.maxResponseSizeBytes == 0 {
+		c.maxResponseSizeBytes = 10 * 1000 * 1000
+	}
+
 	return &Task{
 		config:    c,
 		logger:    logger,
@@ -1306,6 +1329,12 @@ func newTestTaskWithContext(cfg *Config) (*Task, types.Variables, *types.TaskRes
 		config = *cfg
 	}
 
+	// Ensure maxResponseSizeBytes has a default for tests that don't call Validate
+	// Use decimal value (10MB = 10,000,000) consistent with humanize.ParseBytes
+	if config.maxResponseSizeBytes == 0 {
+		config.maxResponseSizeBytes = 10 * 1000 * 1000
+	}
+
 	task := &Task{
 		ctx:       ctx,
 		config:    config,
@@ -1602,3 +1631,301 @@ func TestRunCheck_ContinueOnPass(t *testing.T) {
 		t.Errorf("result = %v, want TaskResultSuccess", *result)
 	}
 }
+
+// =============================================================================
+// Full-Cycle Integration Tests
+// =============================================================================
+// These tests verify the complete flow from DefaultConfig() through Validate()
+// to execution, mirroring how the task is used in production.
+
+func TestIntegration_ValueMode(t *testing.T) {
+	// Setup mock metrics server
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		_, _ = w.Write([]byte(`
+# HELP http_requests_total Total HTTP requests
+# TYPE http_requests_total counter
+http_requests_total{method="GET",status="200"} 150
+http_requests_total{method="POST",status="200"} 50
+`))
+	}))
+	defer server.Close()
+
+	// Start from DefaultConfig (like production)
+	cfg := DefaultConfig()
+	cfg.URL = server.URL
+	cfg.Assertions = []AssertionConfig{
+		{
+			Name:     "get_requests_above_100",
+			Metric:   "http_requests_total",
+			Labels:   map[string]string{"method": "GET", "status": "200"},
+			Mode:     AssertionModeValue,
+			Operator: OperatorGt,
+			Value:    100,
+		},
+	}
+
+	// Validate (like production)
+	if err := cfg.Validate(); err != nil {
+		t.Fatalf("Validate() failed: %v", err)
+	}
+
+	// Verify maxResponseSizeBytes was set by Validate
+	if cfg.GetMaxResponseSizeBytes() == 0 {
+		t.Fatal("maxResponseSizeBytes should be set after Validate()")
+	}
+
+	// Create task with context (like production)
+	logger := logrus.New()
+	logger.SetLevel(logrus.PanicLevel)
+
+	outputs := vars.NewVariables(nil)
+
+	var lastResult types.TaskResult
+
+	ctx := &types.TaskContext{
+		Outputs:        outputs,
+		SetResult:      func(r types.TaskResult) { lastResult = r },
+		ReportProgress: func(_ float64, _ string) {},
+	}
+
+	task := &Task{
+		ctx:        ctx,
+		config:     cfg,
+		logger:     logger,
+		baselines:  make(map[string]float64),
+		httpClient: &http.Client{Timeout: cfg.RequestTimeout.Duration},
+	}
+
+	// Run check
+	done, err := task.runCheck(context.Background())
+	if err != nil {
+		t.Fatalf("runCheck() error: %v", err)
+	}
+
+	if !done {
+		t.Error("expected done=true when assertion passes")
+	}
+
+	if lastResult != types.TaskResultSuccess {
+		t.Errorf("result = %v, want TaskResultSuccess", lastResult)
+	}
+
+	// Verify outputs
+	passed := outputs.GetVar("passedAssertions")
+	if passed == nil {
+		t.Fatal("passedAssertions output not set")
+	}
+
+	passedList, ok := passed.([]any)
+	if !ok {
+		t.Fatalf("passedAssertions type = %T, want []any", passed)
+	}
+
+	if len(passedList) != 1 || passedList[0] != "get_requests_above_100" {
+		t.Errorf("passedAssertions = %v, want [get_requests_above_100]", passedList)
+	}
+}
+
+func TestIntegration_DeltaMode(t *testing.T) {
+	requestCount := 0
+
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		requestCount++
+
+		// First scrape: baseline of 100
+		// Second scrape: value of 150 (delta = 50)
+		value := 100
+		if requestCount > 1 {
+			value = 150
+		}
+
+		_, _ = fmt.Fprintf(w, `
+# HELP requests_total Total requests
+# TYPE requests_total counter
+requests_total %d
+`, value)
+	}))
+	defer server.Close()
+
+	cfg := DefaultConfig()
+	cfg.URL = server.URL
+	cfg.Assertions = []AssertionConfig{
+		{
+			Name:     "delta_above_40",
+			Metric:   "requests_total",
+			Mode:     AssertionModeDelta,
+			Operator: OperatorGt,
+			Value:    40,
+		},
+	}
+
+	if err := cfg.Validate(); err != nil {
+		t.Fatalf("Validate() failed: %v", err)
+	}
+
+	logger := logrus.New()
+	logger.SetLevel(logrus.PanicLevel)
+
+	outputs := vars.NewVariables(nil)
+
+	var lastResult types.TaskResult
+
+	ctx := &types.TaskContext{
+		Outputs:        outputs,
+		SetResult:      func(r types.TaskResult) { lastResult = r },
+		ReportProgress: func(_ float64, _ string) {},
+	}
+
+	task := &Task{
+		ctx:        ctx,
+		config:     cfg,
+		logger:     logger,
+		baselines:  make(map[string]float64),
+		httpClient: &http.Client{Timeout: cfg.RequestTimeout.Duration},
+	}
+
+	// First scrape - records baseline, doesn't complete
+	done, err := task.runCheck(context.Background())
+	if err != nil {
+		t.Fatalf("first runCheck() error: %v", err)
+	}
+
+	if done {
+		t.Error("expected done=false on first scrape (baseline recording)")
+	}
+
+	// Second scrape - evaluates delta
+	done, err = task.runCheck(context.Background())
+	if err != nil {
+		t.Fatalf("second runCheck() error: %v", err)
+	}
+
+	if !done {
+		t.Error("expected done=true on second scrape")
+	}
+
+	if lastResult != types.TaskResultSuccess {
+		t.Errorf("result = %v, want TaskResultSuccess", lastResult)
+	}
+
+	// Verify delta output
+	deltas := outputs.GetVar("deltas")
+	if deltas == nil {
+		t.Fatal("deltas output not set")
+	}
+
+	deltasMap, ok := deltas.(map[string]any)
+	if !ok {
+		t.Fatalf("deltas type = %T, want map[string]any", deltas)
+	}
+
+	if delta, exists := deltasMap["delta_above_40"]; !exists || delta != 50.0 {
+		t.Errorf("deltas[delta_above_40] = %v, want 50.0", deltasMap["delta_above_40"])
+	}
+}
+
+func TestIntegration_MultipleAssertions(t *testing.T) {
+	server := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
+		_, _ = w.Write([]byte(`
+# HELP cpu_usage CPU usage percentage
+# TYPE cpu_usage gauge
+cpu_usage{host="server1"} 45.5
+cpu_usage{host="server2"} 78.2
+# HELP memory_usage Memory usage percentage
+# TYPE memory_usage gauge
+memory_usage{host="server1"} 60.0
+`))
+	}))
+	defer server.Close()
+
+	cfg := DefaultConfig()
+	cfg.URL = server.URL
+	cfg.Assertions = []AssertionConfig{
+		{
+			Name:     "server1_cpu_ok",
+			Metric:   "cpu_usage",
+			Labels:   map[string]string{testLabelHost: "server1"},
+			Mode:     AssertionModeValue,
+			Operator: OperatorLt,
+			Value:    50,
+		},
+		{
+			Name:     "server1_memory_ok",
+			Metric:   "memory_usage",
+			Labels:   map[string]string{testLabelHost: "server1"},
+			Mode:     AssertionModeValue,
+			Operator: OperatorLte,
+			Value:    60,
+		},
+		{
+			Name:     "server2_cpu_high",
+			Metric:   "cpu_usage",
+			Labels:   map[string]string{testLabelHost: "server2"},
+			Mode:     AssertionModeValue,
+			Operator: OperatorGt,
+			Value:    70,
+		},
+	}
+
+	if err := cfg.Validate(); err != nil {
+		t.Fatalf("Validate() failed: %v", err)
+	}
+
+	logger := logrus.New()
+	logger.SetLevel(logrus.PanicLevel)
+
+	outputs := vars.NewVariables(nil)
+
+	var lastResult types.TaskResult
+
+	ctx := &types.TaskContext{
+		Outputs:        outputs,
+		SetResult:      func(r types.TaskResult) { lastResult = r },
+		ReportProgress: func(_ float64, _ string) {},
+	}
+
+	task := &Task{
+		ctx:        ctx,
+		config:     cfg,
+		logger:     logger,
+		baselines:  make(map[string]float64),
+		httpClient: &http.Client{Timeout: cfg.RequestTimeout.Duration},
+	}
+
+	done, err := task.runCheck(context.Background())
+	if err != nil {
+		t.Fatalf("runCheck() error: %v", err)
+	}
+
+	if !done {
+		t.Error("expected done=true when all assertions pass")
+	}
+
+	if lastResult != types.TaskResultSuccess {
+		t.Errorf("result = %v, want TaskResultSuccess", lastResult)
+	}
+
+	// Verify all three passed
+	passed := outputs.GetVar("passedAssertions")
+	passedList, ok := passed.([]any)
+
+	if !ok {
+		t.Fatalf("passedAssertions type = %T, want []any", passed)
+	}
+
+	if len(passedList) != 3 {
+		t.Errorf("passedAssertions count = %d, want 3", len(passedList))
+	}
+
+	// Verify values output
+	values := outputs.GetVar("values")
+	valuesMap, ok := values.(map[string]any)
+
+	if !ok {
+		t.Fatalf("values type = %T, want map[string]any", values)
+	}
+
+	if v := valuesMap["server1_cpu_ok"]; v != 45.5 {
+		t.Errorf("values[server1_cpu_ok] = %v, want 45.5", v)
+	}
+}

From ae254d4c2727429ff5d80561754044480e3d38e7 Mon Sep 17 00:00:00 2001
From: Chetany Bhardwaj <chetanyiot@gmail.com>
Date: Mon, 1 Jun 2026 15:00:18 +0200
Subject: [PATCH 8/8] fix: add require annotations to Config.URL and
 Config.Assertions

---
 pkg/tasks/check_http_metrics/config.go | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/pkg/tasks/check_http_metrics/config.go b/pkg/tasks/check_http_metrics/config.go
index 8e7b73b3..af67d4e8 100644
--- a/pkg/tasks/check_http_metrics/config.go
+++ b/pkg/tasks/check_http_metrics/config.go
@@ -70,7 +70,7 @@ type AssertionConfig struct {
 // Config holds the task configuration for scraping a Prometheus metrics endpoint
 // and evaluating assertions against the scraped values.
 type Config struct {
-	URL             string            `yaml:"url" json:"url" desc:"HTTP URL of the Prometheus metrics endpoint."`
+	URL             string            `yaml:"url" json:"url" require:"A" desc:"HTTP URL of the Prometheus metrics endpoint."`
 	Headers         map[string]string `yaml:"headers" json:"headers" desc:"Optional HTTP request headers."`
 	PollInterval    helper.Duration   `yaml:"pollInterval" json:"pollInterval" desc:"Interval between metric scrapes."`
 	RequestTimeout  helper.Duration   `yaml:"requestTimeout" json:"requestTimeout" desc:"Timeout for a single HTTP request."`
@@ -80,7 +80,7 @@ type Config struct {
 	MissingMetric   MissingBehavior   `yaml:"missingMetric" json:"missingMetric" desc:"Behavior when metric doesn't exist: wait, fail, pass."`
 	MissingSeries   MissingBehavior   `yaml:"missingSeries" json:"missingSeries" desc:"Behavior when no series matches labels: wait, fail, pass."`
 	ResetBehavior   ResetBehavior     `yaml:"resetBehavior" json:"resetBehavior" desc:"Behavior on counter reset in delta mode: fail, rebaseline, ignore."`
-	Assertions      []AssertionConfig `yaml:"assertions" json:"assertions" desc:"List of metric assertions to evaluate."`
+	Assertions      []AssertionConfig `yaml:"assertions" json:"assertions" require:"B" desc:"List of metric assertions to evaluate."`
 
 	// Parsed values (not from YAML)
 	maxResponseSizeBytes int64