gravitational · fheinecke · Mar 19, 2024 · Mar 19, 2024 · Mar 19, 2024 · Mar 19, 2024
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -5,6 +5,11 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
 ## [Unreleased]
+### Added
+- Added `gha_workflow_run_elapsed_seconds` metric tracking workflow elapsed (wall clock) time
+
+### Changed
+- Renamed `gha_workflow_run_time_seconds` to `gha_workflow_run_runner_seconds`
 
 ## [0.0.9] - 2024-03-18
 ### Fixed

diff --git a/collector.go b/collector.go
@@ -16,9 +16,15 @@ import (
 )
 
 var (
-	workflowRunTimeVec = prometheus.NewCounterVec(
+	workflowRunRunnerTimeVec = prometheus.NewCounterVec(
 		prometheus.CounterOpts{
-			Name: "gha_workflow_run_time_seconds",
+			Name: "gha_workflow_run_runner_seconds",
+		},
+		[]string{"repo", "ref", "event_type", "workflow"},
+	)
+	workflowRunElapsedTimeVec = prometheus.NewCounterVec(
+		prometheus.CounterOpts{
+			Name: "gha_workflow_run_elapsed_seconds",
 		},
 		[]string{"repo", "ref", "event_type", "workflow"},
 	)
@@ -67,7 +73,8 @@ type Collector struct {
 }
 
 func NewCollector(cfg *CLI) *Collector {
-	prometheus.MustRegister(workflowRunTimeVec)
+	prometheus.MustRegister(workflowRunRunnerTimeVec)
+	prometheus.MustRegister(workflowRunElapsedTimeVec)
 	prometheus.MustRegister(jobRunTimeVec)
 	prometheus.MustRegister(stepRunTimeVec)
 	prometheus.MustRegister(workflowRunCountVec)
@@ -199,6 +206,13 @@ func (c *Collector) collectJobs(ctx context.Context, repo string, run *github.Wo
 }
 
 func countJobs(run *github.WorkflowRun, jobs []*github.WorkflowJob) {
+	// Skip re-runs (run attempt > 1). The tool doesn't currently account for
+	// more than one run attempt, as this brings a multitude of issues that
+	// are near-impossible to account for due to GH's API design.
+	if run.GetRunAttempt() > 1 {
+		return
+	}
+
 	workflowName := path.Base(run.GetPath())
 	workflowName = strings.TrimSuffix(workflowName, path.Ext(workflowName))
 	repo := run.GetRepository().GetName()
@@ -244,7 +258,8 @@ func countJobs(run *github.WorkflowRun, jobs []*github.WorkflowJob) {
 		return
 	}
 
-	workflowRunTimeVec.WithLabelValues(repo, ref, eventType, workflowName).Add(workflowRunTime.Seconds())
+	workflowRunRunnerTimeVec.WithLabelValues(repo, ref, eventType, workflowName).Add(workflowRunTime.Seconds())
+	workflowRunElapsedTimeVec.WithLabelValues(repo, ref, eventType, workflowName).Add(run.GetUpdatedAt().Sub(run.GetCreatedAt().Time).Seconds())
 }
 
 func makeRef(run *github.WorkflowRun) string {

diff --git a/metrics.md b/metrics.md
@@ -43,16 +43,27 @@ A `counter` of the run time of jobs in a workflow. This is a sum of the
 Same as `gha_step_run_time_seconds` but without the `step` label.
 
 
-## `gha_workflow_run_time_seconds`
+## `gha_workflow_run_runner_seconds`
 
-A `counter` of the run time of a workflow. This is a sum of the
+A `counter` of the runner time consumed by a workflow. This is a sum of the
 `gha_job_run_time_seconds` for a particular job instance (job ID in GHA).
 
 ### Labels
 
 Same as `gha_job_run_time_seconds` but without the `job` label.
 
 
+## `gha_workflow_run_elapsed_seconds`
+
+A `counter` of the elapsed run time of a workflow. This is the "wall clock
+time": how much time passed between when a run was created and when it
+was last updated, which is used as the time the run ended.
+
+### Labels
+
+Same as `gha_job_run_time_seconds` but without the `job` label.
+
+
 ## `gha_step_run_count`
 
 A `counter` of the number of runs of a step by conclusion.