inoki-giskard's picture
Use another process to run scan
60a5363
raw
history blame
2.97 kB
import argparse
from giskard_cicd.loaders import GithubLoader, HuggingFaceLoader
from giskard_cicd.pipeline.runner import PipelineRunner
from automation import create_discussion_detailed
if __name__ == "__main__":
parser = argparse.ArgumentParser(
prog="Giskard Scanner", description="Scans a model for vulnerabilities and produces a report."
)
parser.add_argument(
"--loader",
help="Which loader to use to set up the model. Currently only `github` and `huggingface` are supported.",
required=True,
)
parser.add_argument("--model", help="The model to scan.", required=True)
parser.add_argument("--dataset", help="The validation or test dataset that will be used.")
parser.add_argument(
"--dataset_split", help="The split of the dataset to use. If not provided, the best split will be selected."
)
parser.add_argument("--dataset_config", help="The name of the dataset config subset to use.")
parser.add_argument("--scan_config", help="Path to YAML file containing the configuration of the scan.")
parser.add_argument("--output", help="Optional name of the output file.")
parser.add_argument("--output_format", help="Format of the report (either HTML or markdown). Default is HTML.")
parser.add_argument("--output_portal", help="The output portal of the report (either huggingface or local directory). Default is local.")
parser.add_argument("--discussion_repo", help="The repo to push the report to.")
parser.add_argument("--hf_token", help="The token to push the report to the repo.")
args = parser.parse_args()
supported_loaders = {
"huggingface": HuggingFaceLoader(),
"github": GithubLoader(),
}
runner = PipelineRunner(loaders=supported_loaders)
runner_kwargs = {"loader_id": args.loader,
"model": args.model,
"dataset": args.dataset,
"scan_config": args.scan_config}
if args.loader == "huggingface":
runner_kwargs.update({"dataset_split": args.dataset_split,
"dataset_config": args.dataset_config})
report = runner.run(**runner_kwargs)
# In the future, write markdown report or directly push to discussion.
if args.output_format == "markdown":
rendered_report = report.to_markdown(template="github")
else:
rendered_report = report.to_html()
if args.output_portal == "huggingface":
# Push to discussion
create_discussion_detailed(args.discussion_repo, args.model, args.dataset, args.dataset_config, args.dataset_split, args.hf_token, rendered_report)
if args.output:
with open(args.output, "w") as f:
f.write(rendered_report)
else:
# To stdout
# print(rendered_report)
model_name = args.model.split("/")[-1]
with open(f"{model_name}_report.html", "w") as f:
f.write(rendered_report)