summary refs log tree commit diff stats
path: root/classification/tools/analyze_results.py
blob: 663c1f5590a8f989b75cf4df94e3bf33f9f27460 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
from argparse import ArgumentParser
from os import path, listdir

parser = ArgumentParser()

parser.add_argument('-b', '--bugs', required = True)
parser.add_argument('-d', '--search_directory', required = True)

args = parser.parse_args()

def list_files_recursive(directory, basename = False):
    result = []
    for entry in listdir(directory):
        full_path = path.join(directory, entry)
        if path.isdir(full_path):
            result = result + list_files_recursive(full_path, basename)
        else:
            if basename:
                result.append(path.basename(full_path))
            else:
                result.append(full_path)
    return result

def output_csv(dictionary, full_path):
    with open(path.join(full_path, 'analysis.csv'), "w") as file:
        file.write("category, count\n")
        for key, value in dictionary.items():
            file.write(f"{key}, {value}\n")

def main():
    result = {}
    mistranslation_bugs = list_files_recursive(args.bugs, True)
    bugs = list_files_recursive(args.search_directory, False)

    for mistranslation_bug in mistranslation_bugs:
        for bug in bugs:
            if mistranslation_bug == path.basename(bug):
                category = path.basename(path.dirname(bug))
                if category in result:
                    result[category] += 1
                else:
                    result[category] = 1
                continue

    output_csv(result, args.search_directory)

if __name__ == "__main__":
    main()