Rewrite sarif-runner as full tool, sarif-extract-scans-runner

This commit is contained in:
Michael Hohn
2022-08-08 14:47:25 -07:00
committed by =Michael Hohn
parent 560b9ecf35
commit 7e996e746c
3 changed files with 217 additions and 77 deletions

View File

@@ -1,77 +0,0 @@
#!/usr/bin/env python3
"""Run sarif-extract-scans over every SARIF file listed in sarif-files.txt.

Each line of sarif-files.txt names one SARIF file, normally as
``project/file.json``.  For every listed file this script

* writes a ``<component>.scanspec`` JSON file next to the SARIF file,
* creates a ``<component>.scantables`` output directory,
* runs ``sarif-extract-scans <scanspec> <output_dir>``.

Paths whose run succeeded are remembered in the pickle file
``successful_runs`` so a later invocation only re-runs the failures.
"""
import hashlib
import json
import os
import pickle
import subprocess
from datetime import datetime

# File listing the SARIF files to process, one path per line.
SARIF_LIST_FILE = 'sarif-files.txt'
# Pickled set of paths that were already processed successfully.
STATE_FILE = 'successful_runs'
# Upper bound on the number of listed lines that are processed.
max_files = 80000
# Print a timestamp and checkpoint the state every this many lines.
REPORT_INTERVAL = 10
# Number of trailing stderr lines echoed to stdout for a failed run.
ERROR_TAIL_LINES = 5


def stable_project_id(project, component):
    """Return a non-negative 63-bit id derived from *project* and *component*.

    The builtin ``hash()`` of a str is salted per process (PYTHONHASHSEED),
    so it yields a different id on every run; a SHA-256 digest is stable
    across runs and machines.  A NUL separator keeps ("ab", "c") and
    ("a", "bc") from colliding.
    """
    digest = hashlib.sha256(f"{project}\0{component}".encode("utf-8")).digest()
    # Drop one bit so the value fits a signed 64-bit integer column.
    return int.from_bytes(digest[:8], "big") >> 1


def split_sarif_path(path):
    """Split *path* into ``(project, component)``.

    The project is everything before the last '/', the component is the file
    name with a trailing ``.json`` removed.  Paths with zero or several '/'
    are accepted instead of raising on tuple unpacking.
    """
    project, _, sarif_file = path.rpartition('/')
    return project, sarif_file.removesuffix('.json')


def error_tail(stderr, count=ERROR_TAIL_LINES):
    """Return the last *count* lines of *stderr*.

    Works whether or not the text ends in a newline, so the final line is
    never dropped.
    """
    if count <= 0:
        return []
    return stderr.splitlines()[-count:]


def load_successful_runs(state_file=STATE_FILE):
    """Load the set of already-successful paths, or an empty set if none saved."""
    try:
        with open(state_file, "rb") as infile:
            # NOTE: pickle can execute arbitrary code while loading; the state
            # file must only ever be one written by this script.
            return pickle.load(infile)
    except FileNotFoundError:
        return set()


def save_successful_runs(successful_runs, state_file=STATE_FILE):
    """Persist the set of successful paths to *state_file*."""
    with open(state_file, 'wb') as outfile:
        pickle.dump(successful_runs, outfile)


def prepare_scan(path, project, component):
    """Write the scan spec and create the table directory for *path*.

    Returns ``(scan_spec_file, output_dir)``.  Raises OSError when the SARIF
    file or its project directory is missing or not writable.
    """
    scan_spec = {
        "project_id": stable_project_id(project, component),
        # The SARIF file's modification time serves as the scan id.
        "scan_id": int(os.path.getmtime(path)),
        "sarif_file_name": path,
    }
    scan_spec_file = os.path.join(project, component + ".scanspec")
    with open(scan_spec_file, 'w') as fp:
        json.dump(scan_spec, fp)

    output_dir = os.path.join(project, component + ".scantables")
    os.makedirs(output_dir, mode=0o755, exist_ok=True)
    return scan_spec_file, output_dir


def report_failure(path, scan_log_file, stderr):
    """Write the full *stderr* to *scan_log_file* and print only its tail."""
    print("{:6} {} {}".format("FAIL", path, scan_log_file))
    with open(scan_log_file, 'w') as fp:
        fp.write(stderr)
    print("{:6} {}".format("", "Error tail: "))
    for line in error_tail(stderr):
        print("{:6} {}".format("", line))


def main():
    """Process every listed SARIF file, skipping ones that already succeeded."""
    with open(SARIF_LIST_FILE, 'r') as listing:
        paths = [line.rstrip() for line in listing]

    # Use saved status, only re-run failed attempts.
    successful_runs = load_successful_runs()
    try:
        for count, path in enumerate(paths[:max_files], start=1):
            if not path:
                # Blank line in the listing.
                continue
            project, component = split_sarif_path(path)
            try:
                scan_spec_file, output_dir = prepare_scan(
                    path, project, component)
            except OSError as err:
                # One unreadable file must not abort the whole batch.
                print("{:6} {} {}".format("FAIL", path, err))
                continue

            if path in successful_runs:
                # Don't rerun
                continue

            if count % REPORT_INTERVAL == 0:
                # Some timing information, and an occasional checkpoint.
                print("{:6} {}".format("DATE", datetime.now().isoformat()))
                save_successful_runs(successful_runs)

            scan_log_file = os.path.join(project, component + ".scanlog")
            runstats = subprocess.run(
                ['sarif-extract-scans', scan_spec_file, output_dir],
                capture_output=True, text=True)
            if runstats.returncode == 0:
                print("{:6} {}".format("OK", path))
                successful_runs.add(path)
            else:
                report_failure(path, scan_log_file, runstats.stderr)
    finally:
        # Always persist progress, including successes since the last
        # checkpoint and on interruption.
        save_successful_runs(successful_runs)


if __name__ == "__main__":
    main()

View File

@@ -5,5 +5,26 @@
#
# Exercise the individual extraction commands on the treeio sample data.
# Each command runs in its own subshell so the `cd` does not leak into
# later commands.
( cd ../data/treeio/2021-12-09 && sarif-extract-tables results.sarif test-tables )
( cd ../data/treeio/2022-02-25 && sarif-extract-tables results.sarif test-tables )
( cd ../data/treeio && sarif-extract-multi multi-sarif-01.json test-multi-table )
( cd ../data/treeio && sarif-extract-scans scan-spec-0.json test-scan )
# Simple run
# The list of SARIF files is passed on stdin via a here-document (the `-`
# argument); the runner's stdout is discarded.
( cd ../data/treeio/ &&
sarif-extract-scans-runner - > /dev/null <<EOF
2021-12-09/results.sarif
2022-02-25/results.sarif
EOF
)
# Repeated run with state
# The same file list is fed to the runner twice in a row with identical
# options, both runs naming `successful-runs`.
# NOTE(review): presumably `-s` names the saved-state file and `-i1` sets the
# update interval to 1, so the second run should find the first run's
# results -- confirm against the runner's --help.
( cd ../data/treeio/ &&
sarif-extract-scans-runner -i1 -s successful-runs - <<EOF
2021-12-09/results.sarif
2022-02-25/results.sarif
EOF
sarif-extract-scans-runner -i1 -s successful-runs - <<EOF
2021-12-09/results.sarif
2022-02-25/results.sarif
EOF
)