-
Notifications
You must be signed in to change notification settings - Fork 136
Expand file tree
/
Copy pathprint_workflow_run_errors.py
More file actions
467 lines (408 loc) · 20.4 KB
/
print_workflow_run_errors.py
File metadata and controls
467 lines (408 loc) · 20.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
#!/usr/bin/env python3
# Copyright 2024 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Fetches and prints errors from a GitHub Workflow run."""
import argparse
import os
import sys
import datetime
import requests
import json
import re
import subprocess
from requests.adapters import HTTPAdapter
from requests.packages.urllib3.util.retry import Retry
# Constants for GitHub API interaction
RETRIES = 3  # Max retry attempts for transient HTTP failures
BACKOFF = 5  # Exponential-backoff factor (seconds) passed to urllib3 Retry
RETRY_STATUS = (403, 500, 502, 504) # HTTP status codes to retry on
TIMEOUT = 10 # Default timeout for requests in seconds
LONG_TIMEOUT = 30 # Timeout for potentially longer requests like log downloads
# Global variables for the target repository, populated by set_repo_info()
OWNER = ''  # Repository owner (user or organization); set by set_repo_info()
REPO = ''  # Repository name; set by set_repo_info()
BASE_URL = 'https://api.github.com'  # Root of the GitHub REST API
GITHUB_API_URL = ''  # Per-repo API base ({BASE_URL}/repos/{OWNER}/{REPO}); set by set_repo_info()
def set_repo_info(owner_name, repo_name):
    """Record the target repository and derive its per-repo API base URL.

    Args:
        owner_name: GitHub user or organization that owns the repository.
        repo_name: Name of the repository.

    Returns:
        True, always (callers treat a falsy return as failure).
    """
    global OWNER, REPO, GITHUB_API_URL
    OWNER, REPO = owner_name, repo_name
    GITHUB_API_URL = f'{BASE_URL}/repos/{OWNER}/{REPO}'
    return True
def requests_retry_session(retries=RETRIES,
                           backoff_factor=BACKOFF,
                           status_forcelist=RETRY_STATUS):
    """Build a requests.Session that retries transient failures.

    Args:
        retries: Max attempts for connect, read, and total retries.
        backoff_factor: urllib3 exponential-backoff factor between attempts.
        status_forcelist: HTTP status codes that trigger a retry.

    Returns:
        A requests.Session with the retry adapter mounted for both
        http:// and https:// URLs.
    """
    retry_policy = Retry(
        total=retries,
        read=retries,
        connect=retries,
        backoff_factor=backoff_factor,
        status_forcelist=status_forcelist,
    )
    adapter = HTTPAdapter(max_retries=retry_policy)
    session = requests.Session()
    for scheme in ('http://', 'https://'):
        session.mount(scheme, adapter)
    return session
def get_current_branch_name():
    """Return the currently checked-out git branch name, or None.

    Shells out to `git rev-parse --abbrev-ref HEAD`; any failure
    (not a git repo, git missing, undecodable output) is reported to
    stderr and None is returned so the caller can require --branch.
    """
    try:
        raw = subprocess.check_output(
            ["git", "rev-parse", "--abbrev-ref", "HEAD"],
            stderr=subprocess.PIPE,
        )
        return raw.decode().strip()
    except (subprocess.CalledProcessError, FileNotFoundError, UnicodeDecodeError) as e:
        sys.stderr.write(f"Info: Could not determine current git branch via 'git rev-parse --abbrev-ref HEAD': {e}. Branch will need to be specified.\n")
    except Exception as e: # Catch any other unexpected error.
        sys.stderr.write(f"Info: An unexpected error occurred while determining current git branch: {e}. Branch will need to be specified.\n")
    return None
def main():
    """Parse CLI arguments and orchestrate the script.

    Flow: auto-detect repo/branch from the local git checkout, resolve a
    GitHub token, pick the latest run of the requested workflow on the
    branch, then print logs (optionally grep-filtered) for each failed
    step of each failed job. Exits non-zero only on configuration/usage
    errors; "no run found" / "no failed jobs" exit 0.
    """
    # --- Auto-detect owner/repo from the git remote 'origin' (best effort) ---
    determined_owner = None
    determined_repo = None
    try:
        git_url_bytes = subprocess.check_output(["git", "remote", "get-url", "origin"], stderr=subprocess.PIPE)
        git_url = git_url_bytes.decode().strip()
        # Matches both HTTPS (https://github.com/owner/repo) and SSH
        # (git@github.com:owner/repo.git) remote forms.
        match = re.search(r"(?:(?:https?://github\.com/)|(?:git@github\.com:))([^/]+)/([^/.]+)(?:\.git)?", git_url)
        if match:
            determined_owner = match.group(1)
            determined_repo = match.group(2)
            sys.stderr.write(f"Determined repository: {determined_owner}/{determined_repo} from git remote 'origin'.\n")
    except (subprocess.CalledProcessError, FileNotFoundError, UnicodeDecodeError) as e:
        sys.stderr.write(f"Could not automatically determine repository from git remote 'origin': {e}\n")
    except Exception as e:
        sys.stderr.write(f"An unexpected error occurred while determining repository: {e}\n")

    def parse_repo_url_arg(url_string):
        """Parses owner and repository name from various GitHub URL formats."""
        # Stricter than the auto-detect regex above: anchored at end of
        # string, tolerates a trailing '/' or '.git'.
        url_match = re.search(r"(?:(?:https?://github\.com/)|(?:git@github\.com:))([^/]+)/([^/.]+?)(?:\.git)?/?$", url_string)
        if url_match:
            return url_match.group(1), url_match.group(2)
        return None, None

    current_branch = get_current_branch_name()

    # --- Argument parsing; defaults come from the git auto-detection above ---
    parser = argparse.ArgumentParser(
        description="Fetch and display failed steps and their logs from a GitHub workflow run.",
        formatter_class=argparse.RawTextHelpFormatter
    )
    parser.add_argument(
        "--workflow", "--workflow-name",
        type=str,
        default="integration_test.yml",
        help="Name of the workflow file (e.g., 'main.yml' or 'build-test.yml'). Default: 'integration_test.yml'."
    )
    parser.add_argument(
        "--branch",
        type=str,
        default=current_branch,
        help=f"GitHub branch name to check for the workflow run. {'Default: ' + current_branch if current_branch else 'Required if not determinable from current git branch.'}"
    )
    parser.add_argument(
        "--url",
        type=str,
        default=None,
        help="Full GitHub repository URL (e.g., https://github.com/owner/repo or git@github.com:owner/repo.git). Takes precedence over --owner/--repo."
    )
    parser.add_argument(
        "--owner",
        type=str,
        default=determined_owner,
        help=f"Repository owner. Used if --url is not provided. {'Default: ' + determined_owner if determined_owner else 'Required if --url is not used and not determinable from git.'}"
    )
    parser.add_argument(
        "--repo",
        type=str,
        default=determined_repo,
        help=f"Repository name. Used if --url is not provided. {'Default: ' + determined_repo if determined_repo else 'Required if --url is not used and not determinable from git.'}"
    )
    parser.add_argument(
        "--token",
        type=str,
        default=os.environ.get("GITHUB_TOKEN"),
        help="GitHub token. Can also be set via GITHUB_TOKEN env var or from ~/.github_token."
    )
    parser.add_argument(
        "--log-lines",
        type=int,
        default=100,
        help="Number of lines to print from the end of each failed step's log. Default: 100."
    )
    parser.add_argument(
        "--all-failed-steps",
        action="store_true",
        default=False,
        help="If set, print logs for all failed steps in a job. Default is to print logs only for the first failed step."
    )
    parser.add_argument(
        "--grep-pattern", "-g",
        type=str,
        default=None,
        help="Extended Regular Expression (ERE) to search for in logs. If provided, log output will be filtered by grep."
    )
    parser.add_argument(
        "--grep-context", "-C",
        type=int,
        default=5,
        help="Number of lines of leading and trailing context to print for grep matches. Default: 5."
    )
    args = parser.parse_args()
    error_suffix = " (use --help for more details)"

    # --- Token resolution: --token / GITHUB_TOKEN env, then ~/.github_token ---
    token = args.token
    if not token:
        try:
            with open(os.path.expanduser("~/.github_token"), "r") as f:
                token = f.read().strip()
                if token:
                    sys.stderr.write("Using token from ~/.github_token\n")
        except FileNotFoundError:
            pass  # Missing token file is the normal case, not an error.
        except Exception as e:
            sys.stderr.write(f"Warning: Could not read ~/.github_token: {e}\n")
    if not token:
        sys.stderr.write(f"Error: GitHub token not provided. Set GITHUB_TOKEN, use --token, or place it in ~/.github_token.{error_suffix}\n")
        sys.exit(1)
    args.token = token # Ensure args.token is populated

    # --- Repository resolution: --url wins; else explicit --owner/--repo;
    # --- else the git-detected defaults. ---
    final_owner = None
    final_repo = None
    if args.url:
        # "Explicitly set" here means: differs from the auto-detected default,
        # so a user-supplied --owner/--repo that merely matches the detected
        # values is not flagged as a conflict with --url.
        owner_explicitly_set_via_arg = args.owner is not None and args.owner != determined_owner
        repo_explicitly_set_via_arg = args.repo is not None and args.repo != determined_repo
        if owner_explicitly_set_via_arg or repo_explicitly_set_via_arg:
            sys.stderr.write(f"Error: Cannot use --owner or --repo when --url is specified.{error_suffix}\n")
            sys.exit(1)
        parsed_owner, parsed_repo = parse_repo_url_arg(args.url)
        if parsed_owner and parsed_repo:
            final_owner = parsed_owner
            final_repo = parsed_repo
            sys.stderr.write(f"Using repository from --url: {final_owner}/{final_repo}\n")
        else:
            sys.stderr.write(f"Error: Invalid URL format: {args.url}. Expected https://github.com/owner/repo or git@github.com:owner/repo.git{error_suffix}\n")
            sys.exit(1)
    else:
        is_owner_from_user_arg = args.owner is not None and args.owner != determined_owner
        is_repo_from_user_arg = args.repo is not None and args.repo != determined_repo
        if is_owner_from_user_arg or is_repo_from_user_arg: # User explicitly set at least one of owner/repo via args
            if args.owner and args.repo:
                final_owner = args.owner
                final_repo = args.repo
                sys.stderr.write(f"Using repository from --owner/--repo args: {final_owner}/{final_repo}\n")
            else:
                sys.stderr.write(f"Error: Both --owner and --repo must be specified if one is provided explicitly (and --url is not used).{error_suffix}\n")
                sys.exit(1)
        elif args.owner and args.repo: # Both args have values, likely from successful auto-detection (or user provided matching defaults)
            final_owner = args.owner
            final_repo = args.repo
            # No specific message needed if it's from auto-detection, already printed.
            # If user explicitly provided args that match auto-detected, that's fine.
    # If final_owner/repo are still None here, it means auto-detection failed AND user provided nothing for owner/repo.
    # Or, only one of owner/repo was auto-detected and the other wasn't provided.
    if not final_owner or not final_repo:
        missing_parts = []
        if not final_owner: missing_parts.append("--owner")
        if not final_repo: missing_parts.append("--repo")
        error_msg = "Error: Could not determine repository."
        if missing_parts:
            error_msg += f" Missing { ' and '.join(missing_parts) }."
        error_msg += f" Please specify --url, OR both --owner and --repo, OR ensure git remote 'origin' is configured correctly.{error_suffix}"
        sys.stderr.write(error_msg + "\n")
        sys.exit(1)
    if not set_repo_info(final_owner, final_repo):
        # This path should ideally not be reached if final_owner/repo are validated,
        # but as a safeguard:
        sys.stderr.write(f"Error: Could not set repository info to {final_owner}/{final_repo}. Ensure owner/repo are correct.{error_suffix}\n")
        sys.exit(1)
    if not args.branch:
        sys.stderr.write(f"Error: Branch name is required. Please specify --branch or ensure it can be detected from your current git repository.{error_suffix}\n")
        sys.exit(1)

    # --- Locate the run and its failed jobs ---
    sys.stderr.write(f"Processing workflow '{args.workflow}' on branch '{args.branch}' for repo {OWNER}/{REPO}\n")
    run = get_latest_workflow_run(args.token, args.workflow, args.branch)
    if not run:
        sys.stderr.write(f"No workflow run found for workflow '{args.workflow}' on branch '{args.branch}'.\n")
        sys.exit(0)
    sys.stderr.write(f"Found workflow run ID: {run['id']} (Status: {run.get('status')}, Conclusion: {run.get('conclusion')})\n")
    failed_jobs = get_failed_jobs_for_run(args.token, run['id'])
    if not failed_jobs:
        sys.stderr.write(f"No failed jobs found for workflow run ID: {run['id']}.\n")
        if run.get('conclusion') == 'success':
            print(f"Workflow run {run['id']} completed successfully with no failed jobs.")
        elif run.get('status') == 'in_progress' and run.get('conclusion') is None:
            print(f"Workflow run {run['id']} is still in progress. No failed jobs reported yet.")
        else:
            # This case might indicate the workflow failed but not at a job level,
            # or jobs are still pending/running.
            print(f"Workflow run {run['id']} has conclusion '{run.get('conclusion')}' but no specific failed jobs were identified by this script's criteria.")
        sys.exit(0)

    # --- Per-job log reporting ---
    print(f"\n--- Failed Jobs for Workflow Run ID: {run['id']} ({run.get('html_url', 'No URL')}) ---\n")
    for job in failed_jobs:
        print(f"==================================================================================")
        print(f"Job: {job['name']} (ID: {job['id']}) - FAILED")
        print(f"Job URL: {job.get('html_url', 'N/A')}")
        print(f"==================================================================================")
        job_logs = get_job_logs(args.token, job['id'])
        if not job_logs:
            print("Could not retrieve logs for this job.")
            continue
        # Collect the steps the API marked as failed for this job.
        failed_steps_details = []
        if job.get('steps'):
            for step in job['steps']:
                if step.get('conclusion') == 'failure':
                    failed_steps_details.append(step)
        if not failed_steps_details:
            print("\nNo specific failed steps found in job data, but job marked as failed. Printing last lines of full job log as fallback:\n")
            log_lines = job_logs.splitlines()
            for line in log_lines[-args.log_lines:]:
                print(line)
            print("\n--- End of log snippet for job ---")
            continue
        print(f"\n--- Failed Steps in Job: {job['name']} ---")
        first_failed_step_logged = False
        for step in failed_steps_details:
            if not args.all_failed_steps and first_failed_step_logged:
                print(f"\n--- Skipping subsequent failed step: {step.get('name', 'Unnamed step')} (use --all-failed-steps to see all) ---")
                break # Stop after the first failed step if not --all-failed-steps
            step_name = step.get('name', 'Unnamed step')
            print(f"\n--- Step: {step_name} ---")
            # Crude log extraction:
            # GitHub job logs wrap each step in ##[group]...##[endgroup]
            # markers; try to isolate the failed step's segment by name.
            # Regex to match group start, attempting to capture the step name robustly
            escaped_step_name = re.escape(step_name)
            step_start_pattern = re.compile(r"^##\[group\](?:Run\s+|Setup\s+|Complete\s+)?.*?" + escaped_step_name, re.IGNORECASE)
            step_end_pattern = re.compile(r"^##\[endgroup\]")
            current_step_log_segment = []
            capturing_for_failed_step = False
            log_lines_for_job = job_logs.splitlines() # Split once per job
            # Try to find the specific step's log segment
            for line in log_lines_for_job:
                if step_start_pattern.search(line):
                    capturing_for_failed_step = True
                    current_step_log_segment = [line] # Start with the group line
                    continue
                if capturing_for_failed_step:
                    current_step_log_segment.append(line)
                    if step_end_pattern.search(line):
                        capturing_for_failed_step = False
                        # Found the end of the targeted step's log
                        break # Stop processing lines for this step (within this job's logs)
            # Fall back to the full job log when the step segment could
            # not be isolated (e.g. step name never matched a group line).
            log_to_process = ""
            log_source_message = ""
            if current_step_log_segment:
                log_to_process = "\n".join(current_step_log_segment)
                log_source_message = f"Log for failed step '{step_name}'"
            else:
                log_to_process = "\n".join(log_lines_for_job) # Use the full job log as fallback
                log_source_message = f"Could not isolate log for step '{step_name}'. Using entire job log"
            if args.grep_pattern:
                print(f"{log_source_message} (grep results for pattern '{args.grep_pattern}' with context {args.grep_context}):")
                try:
                    # Using subprocess to call grep
                    # Pass log_to_process as stdin to grep
                    process = subprocess.run(
                        ['grep', '-E', f"-C{args.grep_context}", args.grep_pattern],
                        input=log_to_process,
                        text=True,
                        capture_output=True,
                        check=False # Do not throw exception on non-zero exit (e.g. no match)
                    )
                    if process.returncode == 0: # Match found
                        print(process.stdout.strip())
                    elif process.returncode == 1: # No match found
                        print(f"No matches found for pattern '{args.grep_pattern}' in this log segment.")
                    else: # Grep error
                        sys.stderr.write(f"Grep command failed with error code {process.returncode}:\n{process.stderr}\n")
                except FileNotFoundError:
                    sys.stderr.write("Error: 'grep' command not found. Please ensure it is installed and in your PATH to use --grep-pattern.\n")
                    # Fallback to printing last N lines if grep is not found? Or just skip log? For now, skip.
                    print("Skipping log display for this step as grep is unavailable.")
                except Exception as e:
                    sys.stderr.write(f"An unexpected error occurred while running grep: {e}\n")
                    print("Skipping log display due to an error with grep.")
            else:
                # Default behavior: print last N lines
                print(f"{log_source_message} (last {args.log_lines} lines):")
                # current_step_log_segment is a list of lines, log_lines_for_job is also a list of lines
                lines_to_print_from = current_step_log_segment if current_step_log_segment else log_lines_for_job
                for log_line in lines_to_print_from[-args.log_lines:]:
                    print(log_line)
            print(f"--- End of log for step: {step_name} ---")
            first_failed_step_logged = True # Mark that we've logged at least one step
        print(f"\n--- End of Failed Steps for Job: {job['name']} ---\n")
def get_latest_workflow_run(token, workflow_name, branch_name):
    """Fetch the most recent run of a workflow on a given branch.

    Args:
        token: GitHub API token.
        workflow_name: Workflow file name (e.g., 'integration_test.yml').
        branch_name: Branch whose runs are queried.

    Returns:
        The most recent workflow-run dict, or None if there are no runs
        or the request/parse fails (errors are written to stderr).
    """
    url = f'{GITHUB_API_URL}/actions/workflows/{workflow_name}/runs'
    headers = {'Accept': 'application/vnd.github.v3+json', 'Authorization': f'token {token}'}
    params = {'branch': branch_name, 'per_page': 1, 'page': 1} # Get the most recent 1
    try:
        with requests_retry_session().get(url, headers=headers, params=params, timeout=TIMEOUT) as response:
            response.raise_for_status()
            data = response.json()
            # Fix: use .get() so a payload without 'workflow_runs' returns
            # None instead of raising an uncaught KeyError (only
            # RequestException and JSONDecodeError are handled below).
            runs = data.get('workflow_runs') or []
            return runs[0] if runs else None # The first one is the most recent
    except requests.exceptions.RequestException as e:
        sys.stderr.write(f"Error: Failed to fetch workflow runs for '{workflow_name}' on branch '{branch_name}': {e}\n")
        if e.response is not None:
            sys.stderr.write(f"Response content: {e.response.text}\n")
        return None
    except json.JSONDecodeError as e:
        sys.stderr.write(f"Error: Failed to parse JSON response for workflow runs: {e}\n")
        return None
def get_failed_jobs_for_run(token, run_id):
    """Fetch every job of a workflow run and return only the failed ones.

    Pages through the jobs endpoint 100 items at a time. Returns a list
    of job dicts whose conclusion is 'failure' (possibly empty), or None
    if any page fetch or JSON parse fails (errors go to stderr).
    """
    jobs_url = f'{GITHUB_API_URL}/actions/runs/{run_id}/jobs'
    headers = {'Accept': 'application/vnd.github.v3+json', 'Authorization': f'token {token}'}
    per_page = 100  # GitHub caps most paginated endpoints at 100 items per page
    collected = []
    page = 1
    while True:
        params = {'per_page': per_page, 'page': page, 'filter': 'latest'} # 'latest' attempt for each job
        try:
            with requests_retry_session().get(jobs_url, headers=headers, params=params, timeout=TIMEOUT) as response:
                response.raise_for_status()
                payload = response.json()
                batch = payload.get('jobs', [])
                if not batch:
                    break
                collected.extend(batch)
                if len(batch) < per_page:
                    # A short page means there are no further pages.
                    break
                page += 1
        except requests.exceptions.RequestException as e:
            sys.stderr.write(f"Error: Failed to fetch jobs for run ID {run_id} (page {page}): {e}\n")
            if e.response is not None:
                sys.stderr.write(f"Response content: {e.response.text}\n")
            return None # Return None if any page fails
        except json.JSONDecodeError as e:
            sys.stderr.write(f"Error: Failed to parse JSON response for jobs: {e}\n")
            return None
    return [job for job in collected if job.get('conclusion') == 'failure']
def get_job_logs(token, job_id):
    """Download and return the plain-text log of a single job.

    The logs endpoint redirects to a download URL, which requests follows
    automatically. Uses the longer timeout since logs can be large.
    Returns the log text, or None on failure (error written to stderr).
    """
    logs_url = f'{GITHUB_API_URL}/actions/jobs/{job_id}/logs'
    headers = {'Accept': 'application/vnd.github.v3+json', 'Authorization': f'token {token}'}
    try:
        with requests_retry_session().get(logs_url, headers=headers, timeout=LONG_TIMEOUT, stream=False) as response:
            response.raise_for_status()
            # The response body is plain text, not JSON.
            return response.text
    except requests.exceptions.RequestException as e:
        sys.stderr.write(f"Error: Failed to download logs for job ID {job_id}: {e}\n")
        if e.response is not None:
            # Log URLs can expire and the body may be a large HTML error
            # page, so only the status code is echoed here.
            sys.stderr.write(f"Response status: {e.response.status_code}\n")
        return None
if __name__ == "__main__":
main()