[llvm] [CI] Track Queue/In Progress Metrics By Job Rather Than Workflow (PR #127274)
Aiden Grossman via llvm-commits
llvm-commits at lists.llvm.org
Fri Feb 14 15:31:49 PST 2025
https://github.com/boomanaiden154 created https://github.com/llvm/llvm-project/pull/127274
This patch makes it so that the metrics container counts the number of in
progress and queued jobs at the job level rather than at the workflow
level. This helps us distinguish windows versus linux load and also lets
us filter out the MacOS jobs that only run in the release branch.
>From 38d3ff227b9caf9cf062c979417605c52dff2a0d Mon Sep 17 00:00:00 2001
From: Aiden Grossman <aidengrossman at google.com>
Date: Fri, 14 Feb 2025 23:31:39 +0000
Subject: [PATCH] =?UTF-8?q?[=F0=9D=98=80=F0=9D=97=BD=F0=9D=97=BF]=20initia?=
=?UTF-8?q?l=20version?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit
Created using spr 1.3.4
---
.ci/metrics/metrics.py | 67 ++++++++++++++++++++++++++----------------
1 file changed, 41 insertions(+), 26 deletions(-)
diff --git a/.ci/metrics/metrics.py b/.ci/metrics/metrics.py
index 70b787665a8b9..d05444bb9ff80 100644
--- a/.ci/metrics/metrics.py
+++ b/.ci/metrics/metrics.py
@@ -47,36 +47,51 @@ def get_sampled_workflow_metrics(github_repo: github.Repository):
# Other states are available (pending, waiting, etc), but the meaning
# is not documented (See #70540).
# "queued" seems to be the info we want.
- queued_workflow_count = len(
- [
- x
- for x in github_repo.get_workflow_runs(status="queued")
- if x.name in WORKFLOWS_TO_TRACK
- ]
- )
- running_workflow_count = len(
- [
- x
- for x in github_repo.get_workflow_runs(status="in_progress")
- if x.name in WORKFLOWS_TO_TRACK
- ]
- )
+ queued_job_counts = {}
+ for queued_workflow in github_repo.get_workflow_runs(status="queued"):
+ if queued_workflow.name not in WORKFLOWS_TO_TRACK:
+ continue
+ for queued_workflow_job in queued_workflow.jobs():
+ job_name = queued_workflow_job.name
+ if queued_workflow_job.status != "queued":
+ continue
+
+ if job_name not in queued_job_counts:
+ queued_job_counts[job_name] = 1
+ else:
+ queued_job_counts[job_name] += 1
+
+ running_job_counts = {}
+ for running_workflow in github_repo.get_workflow_runs(status="in_progress"):
+ if running_workflow.name not in WORKFLOWS_TO_TRACK:
+ continue
+ for running_workflow_job in running_workflow.jobs():
+ job_name = running_workflow_job.name
+ if running_workflow_job.status != "in_progress":
+ continue
+
+ if job_name not in running_job_counts:
+ running_job_counts[job_name] = 1
+ else:
+ running_job_counts[job_name] += 1
workflow_metrics = []
- workflow_metrics.append(
- GaugeMetric(
- "workflow_queue_size",
- queued_workflow_count,
- time.time_ns(),
+ for queued_job in queued_job_counts:
+ workflow_metrics.append(
+ GaugeMetric(
+ f"workflow_queue_size_{queued_job}",
+ queued_job_counts[queued_job],
+ time.time_ns(),
+ )
)
- )
- workflow_metrics.append(
- GaugeMetric(
- "running_workflow_count",
- running_workflow_count,
- time.time_ns(),
+ for running_job in running_job_counts:
+ workflow_metrics.append(
+ GaugeMetric(
+ f"running_workflow_count_{running_job}",
+ running_job_counts[running_job],
+ time.time_ns(),
+ )
)
- )
# Always send a hearbeat metric so we can monitor is this container is still able to log to Grafana.
workflow_metrics.append(
GaugeMetric("metrics_container_heartbeat", 1, time.time_ns())
More information about the llvm-commits
mailing list