2019-08-28 02:31:29 +08:00
|
|
|
#!/usr/bin/env python
|
2017-03-03 01:00:59 +08:00
|
|
|
|
|
|
|
from __future__ import print_function
|
|
|
|
|
|
|
|
desc = '''Generate the difference of two YAML files into a new YAML file (works on
|
|
|
|
pair of directories too). A new attribute 'Added' is set to True or False
|
|
|
|
depending whether the entry is added or removed from the first input to the
|
|
|
|
next.
|
|
|
|
|
|
|
|
The tools requires PyYAML.'''
|
|
|
|
|
|
|
|
import yaml
|
|
|
|
# Try to use the C parser.
|
|
|
|
try:
|
|
|
|
from yaml import CLoader as Loader
|
|
|
|
except ImportError:
|
|
|
|
from yaml import Loader
|
|
|
|
|
|
|
|
import optrecord
|
|
|
|
import argparse
|
|
|
|
from collections import defaultdict
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
|
|
|
parser = argparse.ArgumentParser(description=desc)
|
2017-07-18 02:00:41 +08:00
|
|
|
parser.add_argument(
|
|
|
|
'yaml_dir_or_file_1',
|
|
|
|
help='An optimization record file or a directory searched for optimization '
|
|
|
|
'record files that are used as the old version for the comparison')
|
|
|
|
parser.add_argument(
|
|
|
|
'yaml_dir_or_file_2',
|
|
|
|
help='An optimization record file or a directory searched for optimization '
|
|
|
|
'record files that are used as the new version for the comparison')
|
2017-03-03 01:00:59 +08:00
|
|
|
parser.add_argument(
|
|
|
|
'--jobs',
|
|
|
|
'-j',
|
2018-01-06 06:05:13 +08:00
|
|
|
default=None,
|
2017-03-03 01:00:59 +08:00
|
|
|
type=int,
|
2017-06-11 05:33:27 +08:00
|
|
|
help='Max job count (defaults to %(default)s, the current CPU count)')
|
2018-02-27 05:15:51 +08:00
|
|
|
parser.add_argument(
|
|
|
|
'--max-size',
|
|
|
|
'-m',
|
|
|
|
default=100000,
|
|
|
|
type=int,
|
|
|
|
help='Maximum number of remarks stored in an output file')
|
2017-06-30 02:56:25 +08:00
|
|
|
parser.add_argument(
|
|
|
|
'--no-progress-indicator',
|
|
|
|
'-n',
|
|
|
|
action='store_true',
|
|
|
|
default=False,
|
|
|
|
help='Do not display any indicator of how many YAML files were read.')
|
2018-02-27 05:15:51 +08:00
|
|
|
parser.add_argument('--output', '-o', default='diff{}.opt.yaml')
|
2017-03-03 01:00:59 +08:00
|
|
|
args = parser.parse_args()
|
|
|
|
|
2017-09-29 13:20:53 +08:00
|
|
|
files1 = optrecord.find_opt_files(args.yaml_dir_or_file_1)
|
|
|
|
files2 = optrecord.find_opt_files(args.yaml_dir_or_file_2)
|
2017-03-03 01:00:59 +08:00
|
|
|
|
2017-06-30 02:56:25 +08:00
|
|
|
print_progress = not args.no_progress_indicator
|
|
|
|
all_remarks1, _, _ = optrecord.gather_results(files1, args.jobs, print_progress)
|
|
|
|
all_remarks2, _, _ = optrecord.gather_results(files2, args.jobs, print_progress)
|
2017-03-03 01:00:59 +08:00
|
|
|
|
|
|
|
added = set(all_remarks2.values()) - set(all_remarks1.values())
|
|
|
|
removed = set(all_remarks1.values()) - set(all_remarks2.values())
|
|
|
|
|
|
|
|
for r in added:
|
|
|
|
r.Added = True
|
|
|
|
for r in removed:
|
|
|
|
r.Added = False
|
2017-07-20 06:04:59 +08:00
|
|
|
|
2018-02-27 05:15:51 +08:00
|
|
|
result = list(added | removed)
|
2017-07-20 06:04:59 +08:00
|
|
|
for r in result:
|
|
|
|
r.recover_yaml_structure()
|
|
|
|
|
2018-02-27 05:15:51 +08:00
|
|
|
for i in range(0, len(result), args.max_size):
|
|
|
|
with open(args.output.format(i / args.max_size), 'w') as stream:
|
|
|
|
yaml.dump_all(result[i:i + args.max_size], stream)
|