openshift-eng · pmtk · Jul 3, 2026 · Jul 3, 2026 · Jul 3, 2026 · Jul 3, 2026
diff --git a/plugins/shared/scripts/aggregate.py b/plugins/shared/scripts/aggregate.py
@@ -25,6 +25,137 @@
 from parse import parse_structured_summary, group_by_signature
 
 
+# ---------------------------------------------------------------------------
+# Detected-job ground truth (deterministic overlay)
+#
+# The prepare phase's jobs/release-<v>-jobs.json and jobs/prs-jobs.json list
+# every detected failed job.  Aggregation starts from that list and joins the
+# parsed analyses onto it; detected jobs with no parsed analysis become
+# explicit placeholders in a separate missing_analysis array, so a job can
+# never silently vanish between detection and the HTML report.
+# ---------------------------------------------------------------------------
+
+def _detected_job(workdir, entry):
+    build_id = entry.get("build_id", "")
+    finished = ""
+    if build_id:
+        evidence_path = os.path.join(workdir, "evidence", f"evidence-{build_id}.json")
+        try:
+            with open(evidence_path) as f:
+                finished = (json.load(f).get("finished") or "")[:10]
+        except (OSError, json.JSONDecodeError):
+            pass
+    return {
+        "job_name": entry.get("job", ""),
+        "job_url": entry.get("url", ""),
+        "build_id": build_id,
+        "download_error": entry.get("download_error", ""),
+        "finished": finished,
+    }
+
+
+def load_detected_release_jobs(workdir, release):
+    """Read jobs/release-<release>-jobs.json into detected-job dicts.
+
+    Returns None when the file is missing or unreadable (distinct from []),
+    so callers can fall back to legacy file-glob behavior.
+    """
+    path = os.path.join(workdir, "jobs", f"release-{release}-jobs.json")
+    try:
+        with open(path) as f:
+            entries = json.load(f)
+    except (OSError, json.JSONDecodeError):
+        return None
+    if not isinstance(entries, list):
+        return None
+    jobs = []
+    for entry in entries:
+        if not isinstance(entry, dict):
+            continue
+        # Release job lists only contain failures; tolerate a status field.
+        status = entry.get("status", "")
+        if status and status.upper() != "FAILURE":
+            continue
+        jobs.append(_detected_job(workdir, entry))
+    return jobs
+
+
+def load_detected_pr_jobs(workdir):
+    """Read jobs/prs-jobs.json into {pr_number: [detected-job dicts]}.
+
+    prs-jobs.json includes SUCCESS/pending jobs of PRs that had at least one
+    failure; only FAILURE entries count as detected (same filter as
+    plan-analysis.py).  Returns None when the file is missing or unreadable.
+    """
+    path = os.path.join(workdir, "jobs", "prs-jobs.json")
+    try:
+        with open(path) as f:
+            entries = json.load(f)
+    except (OSError, json.JSONDecodeError):
+        return None
+    if not isinstance(entries, list):
+        return None
+    prs = {}
+    for entry in entries:
+        if not isinstance(entry, dict):
+            continue
+        if entry.get("status", "").upper() != "FAILURE":
+            continue
+        pr_number = entry.get("pr_number") or 0
+        prs.setdefault(pr_number, []).append(_detected_job(workdir, entry))
+    return prs
+
+
+def _file_build_id(filepath):
+    """Extract the build id from a per-job report filename.
+
+    Both shapes end in -<build_id>.txt:
+    release-<v>-job-<i>-<build_id>.txt and prs-job-<i>-pr<N>-<build_id>.txt.
+    """
+    m = re.search(r"-(\d+)\.txt$", os.path.basename(filepath))
+    return m.group(1) if m else ""
+
+
+def _placeholder(job):
+    """Missing-analysis entry for a detected job with no parsed report.
+
+    Deliberately carries no fingerprint/severity/stack_layer: placeholders
+    live outside issues[] and must never look like analyzed failures to
+    downstream consumers.
+    """
+    if job.get("download_error"):
+        reason = "artifact download failed"
+    elif not job.get("build_id"):
+        reason = "no build id"
+    else:
+        reason = "analysis report missing or unparseable"
+    return {
+        "job_name": job.get("job_name", ""),
+        "job_url": job.get("job_url", ""),
+        "build_id": job.get("build_id", ""),
+        "finished": job.get("finished", ""),
+        "reason": reason,
+    }
+
+
+def _missing_placeholders(detected, parsed):
+    """Placeholders for detected jobs not covered by any parsed entry.
+
+    Join primarily on build_id (attached to parsed entries from their
+    filename), with job_url as a defensive fallback.
+    """
+    covered_ids = {e.get("build_id") for e in parsed if e.get("build_id")}
+    covered_urls = {e.get("job_url") for e in parsed if e.get("job_url")}
+    missing = []
+    for job in detected:
+        if job.get("build_id") and job["build_id"] in covered_ids:
+            continue
+        if job.get("job_url") and job["job_url"] in covered_urls:
+            continue
+        missing.append(_placeholder(job))
+    return missing
+
+
 def classify_severity(group):
     count = len(group)
     if count >= 5:
@@ -40,16 +171,23 @@ def classify_severity(group):
 # JSON generation
 # ---------------------------------------------------------------------------
 
-def build_release_json(release, jobs, timestamp):
-    """Build the release summary as a dict (ready for json.dump)."""
+def build_release_json(release, jobs, timestamp, detected=None):
+    """Build the release summary as a dict (ready for json.dump).
+
+    When the detected-job list is available, total_failed is the detected
+    count (not the parsed-entry count, which can under- and over-count) and
+    detected jobs with no parsed analysis are listed in missing_analysis.
+    """
     issues, breakdown = _build_issues_from_jobs(jobs)
+    missing = _missing_placeholders(detected, jobs) if detected is not None else []
 
     return {
         "release": release,
-        "total_failed": len(jobs),
+        "total_failed": len(detected) if detected is not None else len(jobs),
         "date": timestamp.strftime("%Y-%m-%d"),
         "breakdown": breakdown,
         "issues": issues,
+        "missing_analysis": missing,
     }
 
 
@@ -92,38 +230,51 @@ def _build_issues_from_jobs(jobs):
             "analysis_gaps": rep.get("analysis_gaps", []),
             "scenarios": sorted({s for j in group for s in j.get("scenarios", [])}),
             "affected_jobs": [
-                {"name": j["job_name"], "date": j["finished"], "url": j["job_url"]}
+                {"name": j["job_name"], "date": j["finished"], "url": j["job_url"],
+                 "build_id": j.get("build_id", "")}
                 for j in group
             ],
         })
 
     return issues, breakdown
 
 
-def build_pr_json(pr_jobs, timestamp):
+def build_pr_json(pr_jobs, timestamp, detected_prs=None):
     """Build the PR summary as a dict (ready for json.dump).
 
-    pr_jobs: dict mapping pr_number to list of job dicts.
+    pr_jobs: dict mapping pr_number to list of parsed job dicts.
+    detected_prs: dict mapping pr_number to detected-job dicts (ground
+    truth), or None when prs-jobs.json is unavailable.  When available,
+    per-PR failed counts come from the detected list and unanalyzed jobs
+    are listed per PR in missing_analysis — including PRs where no report
+    parsed at all.
     """
-    total_failed = sum(len(jobs) for jobs in pr_jobs.values())
+    pr_numbers = sorted(set(pr_jobs) | set(detected_prs or {}))
 
+    total_failed = 0
     prs = []
-    for pr_number, jobs in sorted(pr_jobs.items()):
-        if not jobs:
+    for pr_number in pr_numbers:
+        jobs = pr_jobs.get(pr_number, [])
+        detected = (detected_prs or {}).get(pr_number)
+        missing = _missing_placeholders(detected, jobs) if detected is not None else []
+        if not jobs and not missing:
             continue
-        first = jobs[0]
+        failed = len(detected) if detected is not None else len(jobs)
+        total_failed += failed
+        first = jobs[0] if jobs else {}
         issues, breakdown = _build_issues_from_jobs(jobs)
         prs.append({
             "number": pr_number,
             "title": first.get("pr_title", ""),
             "url": first.get("pr_url", ""),
-            "failed": len(jobs),
+            "failed": failed,
             "breakdown": breakdown,
             "issues": issues,
+            "missing_analysis": missing,
         })
 
     return {
-        "total_prs": len(pr_jobs),
+        "total_prs": len(pr_numbers) if detected_prs is not None else len(pr_jobs),
         "prs_with_failures": len(prs),
         "total_failed": total_failed,
         "date": timestamp.strftime("%Y-%m-%d"),
@@ -205,25 +356,40 @@ def main():
     timestamp = datetime.now(timezone.utc)
 
     if mode == "release":
+        # A recorded collection error must keep rendering as such —
+        # create-report.py falls back to release-<v>-error.txt only when
+        # the summary file is absent, so do not write one.
+        error_path = os.path.join(workdir, "jobs", f"release-{release}-error.txt")
+        if os.path.exists(error_path):
+            print(f"Collection error recorded for release {release}; "
+                  f"not writing a summary", file=sys.stderr)
+            sys.exit(0)
+
+        detected = load_detected_release_jobs(workdir, release)
         files = find_release_job_files(workdir, release)
-        if not files:
+        if detected is None and not files:
             print(f"No job files found for release {release}", file=sys.stderr)
             sys.exit(1)
 
-        print(f"Found {len(files)} job files for release {release}", file=sys.stderr)
+        print(f"Found {len(files)} job files for release {release}"
+              + (f" ({len(detected)} detected failed jobs)" if detected is not None else ""),
+              file=sys.stderr)
         jobs = []
         for filepath in files:
             summaries = parse_structured_summary(filepath)
             if not summaries:
                 print(f"  WARNING: no STRUCTURED SUMMARY in {os.path.basename(filepath)}", file=sys.stderr)
                 continue
+            build_id = _file_build_id(filepath)
+            for summary in summaries:
+                summary["build_id"] = build_id
             jobs.extend(summaries)
 
-        if not jobs:
+        if detected is None and not jobs:
             print("No valid job reports found", file=sys.stderr)
             sys.exit(1)
 
-        result = build_release_json(release, jobs, timestamp)
+        result = build_release_json(release, jobs, timestamp, detected=detected)
         jobs_dir = os.path.join(workdir, "jobs")
         os.makedirs(jobs_dir, exist_ok=True)
         output_path = os.path.join(jobs_dir, f"release-{release}-summary.json")
@@ -233,27 +399,29 @@ def main():
         print(json.dumps(result, indent=2))
 
     elif mode == "prs":
+        detected_prs = load_detected_pr_jobs(workdir)
         files = find_pr_job_files(workdir)
         if not files:
             print("No PR job files found", file=sys.stderr)
-            result = build_pr_json({}, timestamp)
         else:
             print(f"Found {len(files)} PR job files", file=sys.stderr)
-            pr_jobs = {}
-            for filepath in files:
-                summaries = parse_structured_summary(filepath)
-                if not summaries:
-                    print(f"  WARNING: no STRUCTURED SUMMARY in {os.path.basename(filepath)}", file=sys.stderr)
-                    continue
-                for summary in summaries:
-                    summary["pr_title"] = ""
-                    summary["pr_url"] = ""
-
-                m = re.search(r"-pr(\d+)-", os.path.basename(filepath))
-                pr_number = int(m.group(1)) if m else 0
-                pr_jobs.setdefault(pr_number, []).extend(summaries)
-
-            result = build_pr_json(pr_jobs, timestamp)
+        pr_jobs = {}
+        for filepath in files:
+            summaries = parse_structured_summary(filepath)
+            if not summaries:
+                print(f"  WARNING: no STRUCTURED SUMMARY in {os.path.basename(filepath)}", file=sys.stderr)
+                continue
+            build_id = _file_build_id(filepath)
+            for summary in summaries:
+                summary["pr_title"] = ""
+                summary["pr_url"] = ""
+                summary["build_id"] = build_id
+
+            m = re.search(r"-pr(\d+)-", os.path.basename(filepath))
+            pr_number = int(m.group(1)) if m else 0
+            pr_jobs.setdefault(pr_number, []).extend(summaries)
+
+        result = build_pr_json(pr_jobs, timestamp, detected_prs)
 
         jobs_dir = os.path.join(workdir, "jobs")
         os.makedirs(jobs_dir, exist_ok=True)