system and product image diff tool

This tool compares system and product image across models, and generate common.csv and diff.csv Here is example output - common.csv: filename, sha1sum, targets /system/a, da39a3ee5e, a;b;c - diff.csv: filename, sha1sum, targets /system/b, da39a3ee5e, a;b /system/c, 3f786850e3, a /system/c, 89e6c98d92, b;c Bug: 131273025 Test: m system_product_image_diff Test: system_product_image_diff -t model1 model2 -s system product Change-Id: Ie9cc368e0a6d26e956f1e27ebe683bea5e80465c
2019-06-13 18:19:30 +09:00
parent 3a5fc22f69
commit 062f2b09ca
3 changed files with 135 additions and 0 deletions
--- a/vndk/tools/image-diff-tool/diff.py
+++ b/vndk/tools/image-diff-tool/diff.py
@@ -0,0 +1,102 @@
+#
+# Copyright (C) 2019 The Android Open Source Project
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+import subprocess
+import sys
+from collections import defaultdict
+from concurrent import futures
+from glob import glob
+from operator import itemgetter
+import hashlib
+import argparse
+
+tpe = futures.ThreadPoolExecutor()
+
+def strip_and_sha1sum(filepath):
+  def silent_call(cmd):
+    return subprocess.call(cmd, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) == 0
+  objdump = lambda: silent_call(["objdump", "-a", filepath])
+  strip_all = lambda: silent_call(["llvm-strip", "--strip-all", "-keep-section=.ARM.attributes", filepath, "-o", filepath + ".tmp"])
+  remove_build_id = lambda: silent_call(["llvm-strip", "-remove-section=.note.gnu.build-id", filepath + ".tmp", "-o", filepath + ".tmp.no-build-id"])
+
+  def sha1sum(f):
+    with open(f, 'rb') as fin:
+      return hashlib.sha1(fin.read()).hexdigest()
+
+  if objdump():
+    try:
+      if strip_all() and remove_build_id():
+        return sha1sum(filepath + ".tmp.no-build-id")
+      else:
+        return sha1sum(filepath)
+    finally:
+      if os.path.exists(filepath + ".tmp"):
+        os.remove(filepath + ".tmp")
+      if os.path.exists(filepath + ".tmp.no-build-id"):
+        os.remove(filepath + ".tmp.no-build-id")
+  else:
+    return sha1sum(filepath)
+
+
+def main(targets, search_paths):
+  def get_target_name(path):
+    return os.path.basename(os.path.normpath(path))
+  artifact_target_map = defaultdict(list)
+  for target in targets:
+    def valid_path(p):
+      if os.path.isdir(p) or not os.path.exists(p):
+        return False
+      for s in search_paths:
+        if os.path.join(target, s).lower() + os.path.sep in p.lower():
+          return True
+      return False
+    paths = [path for path in glob(os.path.join(
+        target, "**", "*"), recursive=True) if valid_path(path)]
+
+    def run(path):
+      return strip_and_sha1sum(path), path[len(target):]
+    results = map(futures.Future.result, [tpe.submit(run, p) for p in paths])
+
+    for sha1, f in results:
+      basename = os.path.split(os.path.dirname(f))[1] + os.path.basename(f)
+      artifact_target_map[(sha1, basename)].append((get_target_name(target), f))
+
+  def pretty_print(p, ts):
+    assert(len({t for t, _ in ts}) == len(ts))
+    return ";".join({f for _, f in ts}) + ", " + p[0][:10] + ", " + ";".join(map(itemgetter(0), ts)) + "\n"
+  header = "filename, sha1sum, targets\n"
+  common = sorted([pretty_print(p, ts)
+                   for p, ts in artifact_target_map.items() if len(ts) == len(targets)])
+  diff = sorted([pretty_print(p, ts)
+                 for p, ts in artifact_target_map.items() if len(ts) < len(targets)])
+
+  with open("common.csv", 'w') as fout:
+    fout.write(header)
+    fout.writelines(common)
+  with open("diff.csv", 'w') as fout:
+    fout.write(header)
+    fout.writelines(diff)
+
+
+if __name__ == "__main__":
+  parser = argparse.ArgumentParser(prog="system_product_image_diff", usage="system_product_image_diff -t model1 model2 model3 -s system product")
+  parser.add_argument("-t", "--target", nargs='+', required=True)
+  parser.add_argument("-s", "--search_path", nargs='+', required=True)
+
+  args = parser.parse_args()
+  if len(args.target) < 2:
+    parser.error("The number of targets has to be at least two.")
+  main(args.target, args.search_path)