extract warnings in GH workflows (#20487)
Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
This commit is contained in:
@@ -11,40 +11,54 @@ from transformers import logging
|
||||
logger = logging.get_logger(__name__)
|
||||
|
||||
|
||||
def extract_warnings_from_single_artifact(artifact_zip_path, targets):
|
||||
def extract_warnings_from_single_artifact(artifact_path, targets):
|
||||
"""Extract warnings from a downloaded artifact (in .zip format)"""
|
||||
selected_warnings = set()
|
||||
buffer = []
|
||||
|
||||
try:
|
||||
with zipfile.ZipFile(artifact_zip_path) as z:
|
||||
for filename in z.namelist():
|
||||
if not os.path.isdir(filename):
|
||||
# read the file
|
||||
if filename != "warnings.txt":
|
||||
continue
|
||||
with z.open(filename) as f:
|
||||
for line in f:
|
||||
line = line.decode("UTF-8")
|
||||
if "warnings summary (final)" in line:
|
||||
continue
|
||||
# This means we are outside the body of a warning
|
||||
elif not line.startswith(" "):
|
||||
# process a single warning and move it to `selected_warnings`.
|
||||
if len(buffer) > 0:
|
||||
warning = "\n".join(buffer)
|
||||
# Only keep the warnings specified in `targets`
|
||||
if any(f": {x}: " in warning for x in targets):
|
||||
selected_warnings.add(warning)
|
||||
buffer = []
|
||||
continue
|
||||
else:
|
||||
line = line.strip()
|
||||
buffer.append(line)
|
||||
except Exception:
|
||||
logger.warning(
|
||||
f"{artifact_zip_path} is either an invalid zip file or something else wrong. This file is skipped."
|
||||
)
|
||||
def parse_line(fp):
|
||||
for line in fp:
|
||||
if isinstance(line, bytes):
|
||||
line = line.decode("UTF-8")
|
||||
if "warnings summary (final)" in line:
|
||||
continue
|
||||
# This means we are outside the body of a warning
|
||||
elif not line.startswith(" "):
|
||||
# process a single warning and move it to `selected_warnings`.
|
||||
if len(buffer) > 0:
|
||||
warning = "\n".join(buffer)
|
||||
# Only keep the warnings specified in `targets`
|
||||
if any(f": {x}: " in warning for x in targets):
|
||||
selected_warnings.add(warning)
|
||||
buffer.clear()
|
||||
continue
|
||||
else:
|
||||
line = line.strip()
|
||||
buffer.append(line)
|
||||
|
||||
if from_gh:
|
||||
for filename in os.listdir(artifact_path):
|
||||
file_path = os.path.join(artifact_path, filename)
|
||||
if not os.path.isdir(file_path):
|
||||
# read the file
|
||||
if filename != "warnings.txt":
|
||||
continue
|
||||
with open(file_path) as fp:
|
||||
parse_line(fp)
|
||||
else:
|
||||
try:
|
||||
with zipfile.ZipFile(artifact_path) as z:
|
||||
for filename in z.namelist():
|
||||
if not os.path.isdir(filename):
|
||||
# read the file
|
||||
if filename != "warnings.txt":
|
||||
continue
|
||||
with z.open(filename) as fp:
|
||||
parse_line(fp)
|
||||
except Exception:
|
||||
logger.warning(
|
||||
f"{artifact_path} is either an invalid zip file or something else wrong. This file is skipped."
|
||||
)
|
||||
|
||||
return selected_warnings
|
||||
|
||||
@@ -54,7 +68,7 @@ def extract_warnings(artifact_dir, targets):
|
||||
|
||||
selected_warnings = set()
|
||||
|
||||
paths = [os.path.join(artifact_dir, p) for p in os.listdir(artifact_dir) if p.endswith(".zip")]
|
||||
paths = [os.path.join(artifact_dir, p) for p in os.listdir(artifact_dir) if (p.endswith(".zip") or from_gh)]
|
||||
for p in paths:
|
||||
selected_warnings.update(extract_warnings_from_single_artifact(p, targets))
|
||||
|
||||
@@ -81,30 +95,41 @@ if __name__ == "__main__":
|
||||
parser.add_argument(
|
||||
"--token", default=None, type=str, required=True, help="A token that has actions:read permission."
|
||||
)
|
||||
# optional parameters
|
||||
parser.add_argument(
|
||||
"--targets",
|
||||
default="DeprecationWarning,UserWarning,FutureWarning",
|
||||
type=list_str,
|
||||
help="Comma-separated list of target warning(s) which we want to extract.",
|
||||
)
|
||||
parser.add_argument(
|
||||
"--from_gh",
|
||||
action="store_true",
|
||||
help="If running from a GitHub action workflow and collecting warnings from its artifacts.",
|
||||
)
|
||||
|
||||
args = parser.parse_args()
|
||||
|
||||
os.makedirs(args.output_dir, exist_ok=True)
|
||||
from_gh = args.from_gh
|
||||
if from_gh:
|
||||
# The artifacts have to be downloaded using `actions/download-artifact@v2`
|
||||
pass
|
||||
else:
|
||||
os.makedirs(args.output_dir, exist_ok=True)
|
||||
|
||||
# get download links
|
||||
artifacts = get_artifacts_links(args.workflow_run_id)
|
||||
with open(os.path.join(args.output_dir, "artifacts.json"), "w", encoding="UTF-8") as fp:
|
||||
json.dump(artifacts, fp, ensure_ascii=False, indent=4)
|
||||
# get download links
|
||||
artifacts = get_artifacts_links(args.workflow_run_id)
|
||||
with open(os.path.join(args.output_dir, "artifacts.json"), "w", encoding="UTF-8") as fp:
|
||||
json.dump(artifacts, fp, ensure_ascii=False, indent=4)
|
||||
|
||||
# download artifacts
|
||||
for idx, (name, url) in enumerate(artifacts.items()):
|
||||
print(name)
|
||||
print(url)
|
||||
print("=" * 80)
|
||||
download_artifact(name, url, args.output_dir, args.token)
|
||||
# Be gentle to GitHub
|
||||
time.sleep(1)
|
||||
# download artifacts
|
||||
for idx, (name, url) in enumerate(artifacts.items()):
|
||||
print(name)
|
||||
print(url)
|
||||
print("=" * 80)
|
||||
download_artifact(name, url, args.output_dir, args.token)
|
||||
# Be gentle to GitHub
|
||||
time.sleep(1)
|
||||
|
||||
# extract warnings from artifacts
|
||||
selected_warnings = extract_warnings(args.output_dir, args.targets)
|
||||
|
||||
Reference in New Issue
Block a user