system and product image diff tool

This tool compares system and product image across models, and generate
common.csv and diff.csv

Here is example output
- common.csv:
filename, sha1sum, targets
/system/a, da39a3ee5e, a;b;c

- diff.csv:
filename, sha1sum, targets
/system/b, da39a3ee5e, a;b
/system/c, 3f786850e3, a
/system/c, 89e6c98d92, b;c

Bug: 131273025
Test: m system_product_image_diff
Test: system_product_image_diff -t model1 model2 -s system product

Change-Id: Ie9cc368e0a6d26e956f1e27ebe683bea5e80465c
This commit is contained in:
Jeongik Cha
2019-06-13 18:19:30 +09:00
parent 3a5fc22f69
commit 062f2b09ca
3 changed files with 135 additions and 0 deletions

View File

@@ -0,0 +1,102 @@
#
# Copyright (C) 2019 The Android Open Source Project
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import os
import subprocess
import sys
from collections import defaultdict
from concurrent import futures
from glob import glob
from operator import itemgetter
import hashlib
import argparse
tpe = futures.ThreadPoolExecutor()
def strip_and_sha1sum(filepath):
def silent_call(cmd):
return subprocess.call(cmd, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) == 0
objdump = lambda: silent_call(["objdump", "-a", filepath])
strip_all = lambda: silent_call(["llvm-strip", "--strip-all", "-keep-section=.ARM.attributes", filepath, "-o", filepath + ".tmp"])
remove_build_id = lambda: silent_call(["llvm-strip", "-remove-section=.note.gnu.build-id", filepath + ".tmp", "-o", filepath + ".tmp.no-build-id"])
def sha1sum(f):
with open(f, 'rb') as fin:
return hashlib.sha1(fin.read()).hexdigest()
if objdump():
try:
if strip_all() and remove_build_id():
return sha1sum(filepath + ".tmp.no-build-id")
else:
return sha1sum(filepath)
finally:
if os.path.exists(filepath + ".tmp"):
os.remove(filepath + ".tmp")
if os.path.exists(filepath + ".tmp.no-build-id"):
os.remove(filepath + ".tmp.no-build-id")
else:
return sha1sum(filepath)
def main(targets, search_paths):
def get_target_name(path):
return os.path.basename(os.path.normpath(path))
artifact_target_map = defaultdict(list)
for target in targets:
def valid_path(p):
if os.path.isdir(p) or not os.path.exists(p):
return False
for s in search_paths:
if os.path.join(target, s).lower() + os.path.sep in p.lower():
return True
return False
paths = [path for path in glob(os.path.join(
target, "**", "*"), recursive=True) if valid_path(path)]
def run(path):
return strip_and_sha1sum(path), path[len(target):]
results = map(futures.Future.result, [tpe.submit(run, p) for p in paths])
for sha1, f in results:
basename = os.path.split(os.path.dirname(f))[1] + os.path.basename(f)
artifact_target_map[(sha1, basename)].append((get_target_name(target), f))
def pretty_print(p, ts):
assert(len({t for t, _ in ts}) == len(ts))
return ";".join({f for _, f in ts}) + ", " + p[0][:10] + ", " + ";".join(map(itemgetter(0), ts)) + "\n"
header = "filename, sha1sum, targets\n"
common = sorted([pretty_print(p, ts)
for p, ts in artifact_target_map.items() if len(ts) == len(targets)])
diff = sorted([pretty_print(p, ts)
for p, ts in artifact_target_map.items() if len(ts) < len(targets)])
with open("common.csv", 'w') as fout:
fout.write(header)
fout.writelines(common)
with open("diff.csv", 'w') as fout:
fout.write(header)
fout.writelines(diff)
if __name__ == "__main__":
parser = argparse.ArgumentParser(prog="system_product_image_diff", usage="system_product_image_diff -t model1 model2 model3 -s system product")
parser.add_argument("-t", "--target", nargs='+', required=True)
parser.add_argument("-s", "--search_path", nargs='+', required=True)
args = parser.parse_args()
if len(args.target) < 2:
parser.error("The number of targets has to be at least two.")
main(args.target, args.search_path)