From a5b92ee80186380eba06febb8fbf3059136eaa63 Mon Sep 17 00:00:00 2001 From: Christian Krinitsin Date: Tue, 3 Jun 2025 12:02:49 +0000 Subject: add option to parse all bugs --- classification/main.py | 13 ++++++++++++- 1 file changed, 12 insertions(+), 1 deletion(-) (limited to 'classification/main.py') diff --git a/classification/main.py b/classification/main.py index 3f16a281..ea472475 100755 --- a/classification/main.py +++ b/classification/main.py @@ -1,5 +1,10 @@ from transformers import pipeline from os import path, listdir, makedirs +from argparse import ArgumentParser + +parser = ArgumentParser(prog='main.py') +parser.add_argument('-m', '--minimal', action='store_true') +args = parser.parse_args() positive_categories = ['semantic', 'mistranslation', 'instruction', 'assembly'] # to add: register negative_categories = ['other', 'boot', 'network', 'KVM', 'vnc', 'graphic', 'device', 'socket'] # to add: performance @@ -30,7 +35,13 @@ def main(): classifier = pipeline("zero-shot-classification", model="facebook/bart-large-mnli") bugs = list_files_recursive("../results/scraper/mailinglist") - bugs = bugs + list_files_recursive("./semantic_issues") + if args.minimal: + bugs = bugs + list_files_recursive("./semantic_issues") + else: + bugs = bugs + list_files_recursive("../results/scraper/launchpad") + bugs = bugs + list_files_recursive("../results/scraper/gitlab/issues_text") + + print(f"{len(bugs)} number of bugs will be processed") for bug in bugs: print(f"Processing {bug}") with open(bug, "r") as file: -- cgit 1.4.1