[tbb-commits] [Git][tpo/applications/tor-browser-build][main] Bug 40920: Non-deterministic generation of baseline.profm file in Android apks
richard (@richard)
git at gitlab.torproject.org
Fri Aug 11 18:25:52 UTC 2023
richard pushed to branch main at The Tor Project / Applications / tor-browser-build
e49c2819 by Richard Pospesel at 2023-08-11T18:13:49+00:00
Bug 40920: Non-deterministic generation of baseline.profm file in Android apks
- - - - -
3 changed files:
- projects/browser/build.android
- projects/browser/config
- + projects/browser/sort-baseline.py
@@ -9,6 +9,11 @@ ext_dir=$assets_dir/extensions
qa_apk=[% dest_dir %]/[% c('filename') %]/[% c("var/project-name") %]-[% c("version") %]-[% c("var/osname") %]-multi-qa.apk
apk=$rootdir/firefox-android/*-[% c("var/abi") %]-*.apk
+# tor-browser-build#40920
+sorted_baseline_apk=$(basename $apk .apk)_sorted_baseline.apk
+$rootdir/sort-baseline.py --apk $apk $sorted_baseline_apk
+mv $sorted_baseline_apk $apk
# Bundle our extension(s).
# NoScript will be copied over to the profile folder
# as a "regular" browser extension receiving regular AMO updates.
@@ -151,3 +151,6 @@ input_files:
- project: manual
name: manual
enable: '[% ! c("var/android") && c("var/tor-browser") %]'
+ # tor-browser-build#40920
+ - filename: sort-baseline.py
+ enable: '[% c("var/android") %]'
@@ -0,0 +1,185 @@
+# encoding: utf-8
+# SPDX-FileCopyrightText: 2023 FC Stegerman <flx at obfusk.net>
+# SPDX-License-Identifier: GPL-3.0-or-later
+import struct
+import zipfile
+import zlib
+from typing import Any, Dict, Tuple
# Magic numbers and version tags; for the file format see
# https://android.googlesource.com/platform/tools/base
# profgen/profgen/src/main/kotlin/com/android/tools/profgen/ArtProfileSerializer.kt

# First four bytes of a .prof / .profm file.
PROF_MAGIC = b"pro\x00"
PROFM_MAGIC = b"prm\x00"

# Version tags that follow PROF_MAGIC.
PROF_001_N = b"001\x00"
PROF_005_O = b"005\x00"
PROF_009_O_MR1 = b"009\x00"
PROF_010_P = b"010\x00"
PROF_015_S = b"015\x00"

# Version tags that follow PROFM_MAGIC.
PROFM_001_N = b"001\x00"
PROFM_002 = b"002\x00"

# Archive member names of the baseline profile and its metadata file.
ASSET_PROF = "assets/dexopt/baseline.prof"
ASSET_PROFM = "assets/dexopt/baseline.profm"

# ZipInfo attributes that are carried over unchanged to the rewritten entry.
ATTRS = (
    "compress_type",
    "create_system",
    "create_version",
    "date_time",
    "external_attr",
    "extract_version",
    "flag_bits",
)

# Deflate levels tried, in this order, when detecting an entry's level.
LEVELS = (9, 6, 4, 1)
class Error(RuntimeError):
    """Raised by this module for unsupported or inconsistent input."""
# FIXME: is there a better alternative?
class ReproducibleZipInfo(zipfile.ZipInfo):
    """ZipInfo copy whose selected attributes are pinned to fixed values.

    Every ``__slots__`` attribute that is set on the source ``ZipInfo`` is
    copied onto the new instance.  Attributes passed as keyword arguments
    are stored in ``_override`` and always read back as the given value,
    even if something assigns to them afterwards.

    Raises:
        Error: at class-definition time, if ``zipfile.ZipInfo`` provides no
            ``_compresslevel`` attribute at all.
    """

    # Checking __slots__ for "_compresslevel" is too strict: newer Python
    # releases (3.13+) name the slot ``compress_level`` and keep
    # ``_compresslevel`` only as a compatibility property.  hasattr() on the
    # class is true for both the slot descriptor and the property.
    if not hasattr(zipfile.ZipInfo, "_compresslevel"):
        raise Error("zipfile.ZipInfo has no ._compresslevel")

    _compresslevel: int
    # Class-level default; never mutated in place, only replaced per instance.
    _override: Dict[str, Any] = {}

    def __init__(self, zinfo: zipfile.ZipInfo, **override: Any) -> None:
        """Copy the slot attributes of *zinfo* and pin those in *override*."""
        # pylint: disable=W0231
        # ZipInfo.__init__ is deliberately not called: all state is copied
        # from the existing instance instead.
        if override:
            self._override = {**self._override, **override}
        for k in self.__slots__:
            # Slots that were never assigned raise AttributeError; skip them.
            if hasattr(zinfo, k):
                setattr(self, k, getattr(zinfo, k))

    def __getattribute__(self, name: str) -> Any:
        """Return the pinned value for *name* if any, else the real one."""
        # "_override" itself must bypass the lookup to avoid recursion.
        if name != "_override":
            try:
                return self._override[name]
            except KeyError:
                pass
        return object.__getattribute__(self, name)
def sort_baseline(input_file: str, output_file: str) -> None:
    """Read a baseline profile file, sort it, and write the result.

    The output file is only opened once the input has been read and sorted,
    so a failure while sorting leaves no output file behind.

    Args:
        input_file: Path of the profile file to read.
        output_file: Path the sorted profile is written to.
    """
    with open(input_file, "rb") as src:
        sorted_bytes = _sort_baseline(src.read())
    with open(output_file, "wb") as dst:
        dst.write(sorted_bytes)
def _detect_compresslevel(fh_raw: Any, zf_in: zipfile.ZipFile,
                          info: zipfile.ZipInfo) -> int:
    """Return the deflate level in LEVELS that reproduces the stored entry.

    The CRC-32 of the entry's compressed bytes, read straight from the
    archive, is compared with the CRC-32 of the raw-deflate output obtained
    by recompressing the entry's content at each candidate level.

    Raises:
        Error: if no level in LEVELS yields a matching CRC-32.
    """
    # The local file header is 30 bytes; bytes 26-29 hold the lengths of the
    # file name and the extra field that precede the compressed data.
    fh_raw.seek(info.header_offset)
    name_len, extra_len = struct.unpack("<HH", fh_raw.read(30)[26:30])
    fh_raw.seek(info.header_offset + 30 + name_len + extra_len)
    stored_crc = 0
    for done in range(0, info.compress_size, 4096):
        chunk = fh_raw.read(min(info.compress_size - done, 4096))
        stored_crc = zlib.crc32(chunk, stored_crc)
    with zf_in.open(info) as fh_in:
        # wbits=-15 produces a raw deflate stream, as stored in ZIP entries.
        compressors = {lvl: zlib.compressobj(lvl, zlib.DEFLATED, -15) for lvl in LEVELS}
        crcs = dict.fromkeys(LEVELS, 0)
        for block in iter(lambda: fh_in.read(4096), b""):
            for lvl in LEVELS:
                crcs[lvl] = zlib.crc32(compressors[lvl].compress(block), crcs[lvl])
        for lvl in LEVELS:
            if zlib.crc32(compressors[lvl].flush(), crcs[lvl]) == stored_crc:
                return lvl
    raise Error(f"Unable to determine compresslevel for {info.filename!r}")


def sort_baseline_apk(input_apk: str, output_apk: str) -> None:
    """Copy an APK, replacing its baseline.profm with a sorted version.

    Entries are written in their original order with the attributes listed
    in ATTRS pinned to the original values.  Deflated entries are
    recompressed at the level detected from the input; stored entries are
    copied as stored.

    Args:
        input_apk: Path of the APK to read.
        output_apk: Path of the APK to create.

    Raises:
        Error: on an entry that is neither stored nor deflated, or whose
            deflate level cannot be determined.
    """
    with open(input_apk, "rb") as fh_raw, \
            zipfile.ZipFile(input_apk) as zf_in, \
            zipfile.ZipFile(output_apk, "w") as zf_out:
        for info in zf_in.infolist():
            pinned = {attr: getattr(info, attr) for attr in ATTRS}
            zinfo = ReproducibleZipInfo(info, **pinned)
            if info.compress_type == zipfile.ZIP_DEFLATED:
                zinfo._compresslevel = _detect_compresslevel(fh_raw, zf_in, info)
            elif info.compress_type != zipfile.ZIP_STORED:
                raise Error(f"Unsupported compress_type {info.compress_type}")
            if info.filename == ASSET_PROFM:
                print(f"replacing {info.filename!r}...")
                zf_out.writestr(zinfo, _sort_baseline(zf_in.read(info)))
                continue
            # Everything else is streamed through unchanged.
            with zf_in.open(info) as fh_in, zf_out.open(zinfo, "w") as fh_out:
                for block in iter(lambda: fh_in.read(4096), b""):
                    fh_out.write(block)
# Supported .prof: none
# Supported .profm: 002
# Unsupported .profm: 001 N
def _sort_baseline(data: bytes) -> bytes:
    """Sort the contents of a baseline profile given as bytes.

    The first four bytes are the magic, the next four the version tag.
    Only .profm data with version 002 is handled.

    Returns:
        The magic and version followed by the sorted remainder.

    Raises:
        Error: for .prof data, for an unknown magic, or for a .profm
            version other than 002.
    """
    magic, rest = _split(data, 4)
    version, payload = _split(rest, 4)
    if magic == PROF_MAGIC:
        raise Error(f"Unsupported prof version {version!r}")
    if magic != PROFM_MAGIC:
        raise Error(f"Unsupported magic {magic!r}")
    if version != PROFM_002:
        raise Error(f"Unsupported profm version {version!r}")
    return PROFM_MAGIC + PROFM_002 + sort_profm_002(payload)
def sort_profm_002(data: bytes) -> bytes:
    """Sort the dex file entries of a version 002 .profm body by profile key.

    *data* is everything after the magic and version tag: a ``<HII`` header
    (number of dex files, uncompressed size, compressed size) followed by a
    zlib-compressed body.  Each body entry consists of a ``<HH`` pair
    (profile index, key size), the profile key, a ``<IH`` pair (number of
    type ids, number of class ids) and two bytes per class id.

    Entries are ordered by profile key and their profile index is rewritten
    to the new position; all other bytes of an entry are kept as they are.

    Returns:
        The header, with the compressed size updated, followed by the
        sorted body compressed at zlib level 1.

    Raises:
        Error: if a size field does not match, the data ends early, or
            data is left over after the last entry.
        zlib.error: if the compressed body cannot be decompressed.
    """
    header = struct.Struct("<HII")
    if len(data) < header.size:
        raise Error("Unexpected end of data")
    num_dex_files, uncompressed_data_size, compressed_data_size = header.unpack_from(data)
    compressed = data[header.size:]
    if len(compressed) != compressed_data_size:
        raise Error("Compressed data size does not match")
    body = zlib.decompress(compressed)
    if len(body) != uncompressed_data_size:
        raise Error("Uncompressed data size does not match")

    # Walk the body with an offset instead of re-slicing the remainder for
    # every field, which would copy the whole tail each time.
    profiles = []
    pos = 0
    for _ in range(num_dex_files):
        start = pos
        if len(body) - pos < 4:
            raise Error("Unexpected end of data")
        _, key_size = struct.unpack_from("<HH", body, pos)
        pos += 4
        profile_key = body[pos:pos + key_size]
        pos += key_size
        if len(body) - pos < 6:
            raise Error("Unexpected end of data")
        _, num_class_ids = struct.unpack_from("<IH", body, pos)
        pos += 6 + 2 * num_class_ids
        if pos > len(body):
            raise Error("Unexpected end of data")
        profiles.append((profile_key, body[start:pos]))
    if pos != len(body):
        raise Error("Expected end of data")

    # Replace the leading two-byte profile index by the sorted position.
    srtd = b"".join(
        idx.to_bytes(2, "little") + entry[2:]
        for idx, (_, entry) in enumerate(sorted(profiles))
    )
    # Sorting only reorders entries, so the uncompressed size is unchanged.
    cdata = zlib.compress(srtd, 1)
    return header.pack(num_dex_files, uncompressed_data_size, len(cdata)) + cdata
def _unpack(fmt: str, data: bytes) -> Any:
    """Unpack the leading fields of *data* and return them with the rest.

    *fmt* is a struct format made up only of ``<``, ``B``, ``H`` and ``I``.

    Returns:
        A tuple of the unpacked values followed by the remaining bytes.
    """
    widths = {"<": 0, "B": 1, "H": 2, "I": 4}
    assert all(code in widths for code in fmt)
    size = sum(widths[code] for code in fmt)
    head, tail = data[:size], data[size:]
    return (*struct.unpack(fmt, head), tail)
def _split(data: bytes, size: int) -> Tuple[bytes, bytes]:
    """Return the first *size* bytes of *data* and everything after them."""
    head = data[:size]
    tail = data[size:]
    return head, tail
if __name__ == "__main__":
    import argparse

    # Command line: [--apk] INPUT_PROF_OR_APK OUTPUT_PROF_OR_APK
    cli = argparse.ArgumentParser(prog="sort-baseline.py")
    cli.add_argument("--apk", action="store_true")
    cli.add_argument("input_prof_or_apk", metavar="INPUT_PROF_OR_APK")
    cli.add_argument("output_prof_or_apk", metavar="OUTPUT_PROF_OR_APK")
    opts = cli.parse_args()

    # With --apk both paths are APKs; otherwise they are bare profile files.
    handler = sort_baseline_apk if opts.apk else sort_baseline
    handler(opts.input_prof_or_apk, opts.output_prof_or_apk)
+# vim: set tw=80 sw=4 sts=4 et fdm=marker :
View it on GitLab: https://gitlab.torproject.org/tpo/applications/tor-browser-build/-/commit/e49c281950e988f0f882fddc64db5ee431e526df
View it on GitLab: https://gitlab.torproject.org/tpo/applications/tor-browser-build/-/commit/e49c281950e988f0f882fddc64db5ee431e526df
You're receiving this email because of your account on gitlab.torproject.org.
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://lists.torproject.org/pipermail/tbb-commits/attachments/20230811/7d92423d/attachment-0001.htm>
More information about the tbb-commits
mailing list