You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

58 lines
1.6 KiB

#!/usr/bin/env python3
# Copyright (c) 2017-present, Facebook, Inc.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.
import argparse
import json
def load_report(report_filename):
with open(report_filename, 'r') as file_in:
return json.load(file_in)
def compute_duplicates(report):
table = {}
for e in report:
bug_hash = e['hash']
if bug_hash in table:
table[bug_hash].append(e)
else:
table[bug_hash] = [e]
duplicates = []
for value in table.values():
if len(value) > 1:
duplicates += value
return duplicates
def save_duplicates(duplicates, output_filename):
duplicated_types = {}
for e in duplicates:
bug_type = e['bug_type']
if bug_type in duplicated_types:
duplicated_types[bug_type] += 1
else:
duplicated_types[bug_type] = 1
for bug_type, count in duplicated_types.items():
print('{} -> {}'.format(bug_type, count))
with open(output_filename, 'w') as file_out:
json.dump(duplicates, file_out, indent=2, separators=(',', ': '))
cli_parser = argparse.ArgumentParser()
cli_parser.add_argument('--report', type=str, required=True,
help='Infer report')
cli_parser.add_argument('--out', type=str, required=True,
help='Output list of duplicates (in JSON)')
if __name__ == '__main__':
args = cli_parser.parse_args()
report = load_report(args.report)
duplicates = compute_duplicates(report)
save_duplicates(duplicates, args.out)