#!/usr/bin/env vpython3
# Copyright (c) 2011 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""Reports binary size metrics for an APK.

More information at //docs/speed/binary_size/metrics.md.
"""
from __future__ import print_function
import argparse import collections from contextlib import contextmanager import json import logging import os import posixpath import re import struct import sys import tempfile import zipfile import zlib
import devil_chromium from devil.android.sdk import build_tools from devil.utils import cmd_helper from devil.utils import lazy import method_count from pylib import constants from pylib.constants import host_paths
def DumpReports(self, report_func):
  """Replays every combined metric through |report_func|.

  Entries of |self._combined_metrics| are visited in sorted key order. Each
  key is a (graph_title, trace_title, units) tuple.

  Args:
    report_func: Callable invoked as
        report_func(graph_title, trace_title, value, units).
  """
  for key, value in sorted(self._combined_metrics.items()):
    graph_title, trace_title, units = key
    report_func(graph_title, trace_title, value, units)
def SynthesizeTotals(self, unique_method_count):
  """Reports a 'Combined_' total for every accumulated metric.

  Each entry of |self._combined_metrics| is written to |self._chartjson| via
  perf_tests_results_helper.ReportPerfResult with its trace title prefixed by
  'Combined_'.

  Args:
    unique_method_count: Value reported for the 'unique methods' trace in
        place of the accumulated value stored for that trace.
  """
  for key, value in sorted(self._combined_metrics.items()):
    graph_title, trace_title, units = key
    if trace_title == 'unique methods':
      # The caller supplies this count; the accumulated value is discarded.
      value = unique_method_count
    perf_tests_results_helper.ReportPerfResult(
        self._chartjson, graph_title, 'Combined_' + trace_title, value, units)
def _PercentageDifference(a, b):
  """Returns the change from |a| to |b| as a fraction of |a|.

  Despite the name, the result is a fraction (0.5 means +50%), not a value
  scaled by 100. Returns 0 when |a| is 0 to avoid dividing by zero.
  """
  if a == 0:
    return 0
  return float(b - a) / a
def _ReadZipInfoExtraFieldLength(zip_file, zip_info):
  """Reads the value of |extraLength| from |zip_info|'s local file header.

  |zip_info| has an |extra| field, but it's read from the central directory.
  Android's zipalign tool sets the extra field only in local file headers.

  Args:
    zip_file: An open zipfile.ZipFile; its underlying |fp| is repositioned.
    zip_info: The zipfile.ZipInfo entry whose local header is inspected.

  Returns:
    The extra-field length stored in the local file header, as an int.
  """
  # Refer to https://en.wikipedia.org/wiki/Zip_(file_format)#File_headers
  # The 2-byte little-endian "extra field length" sits 28 bytes into the
  # local file header.
  zip_file.fp.seek(zip_info.header_offset + 28)
  return struct.unpack('<H', zip_file.fp.read(2))[0]
def _MeasureApkSignatureBlock(zip_file):
  """Measures the size of the v2 / v3 signing block.

  The size is computed as the gap between the end of the last zip entry and
  the start of the central directory.

  Refer to: https://source.android.com/security/apksigning/v2

  Args:
    zip_file: An open zipfile.ZipFile; its underlying |fp| is repositioned.

  Returns:
    Number of bytes between the last entry's data and the central directory.
  """
  # Seek to "end of central directory" struct (22 fixed bytes + comment).
  eocd_offset_from_end = -22 - len(zip_file.comment)
  zip_file.fp.seek(eocd_offset_from_end, os.SEEK_END)
  assert zip_file.fp.read(4) == b'PK\005\006', (
      'failed to find end-of-central-directory')

  # Read out the "start of central directory" offset (4-byte little-endian
  # value located 16 bytes into the end-of-central-directory record).
  zip_file.fp.seek(eocd_offset_from_end + 16, os.SEEK_END)
  start_of_central_directory = struct.unpack('<I', zip_file.fp.read(4))[0]

  # Compute the offset after the last zip entry.
  last_info = max(zip_file.infolist(), key=lambda i: i.header_offset)
  # Local header = 30 fixed bytes + file name + extra field.
  last_header_size = (30 + len(last_info.filename) +
                      _ReadZipInfoExtraFieldLength(zip_file, last_info))
  end_of_last_file = (
      last_info.header_offset + last_header_size + last_info.compress_size)
  return start_of_central_directory - end_of_last_file
def _ExtractLibSectionSizesFromApk(apk_path, lib_path, tool_prefix):
  """Returns grouped ELF section sizes for a library stored inside an APK.

  Args:
    apk_path: Path to the APK containing the library.
    lib_path: Path of the library within the APK.
    tool_prefix: Passed through to _CreateSectionNameSizeMap.

  Returns:
    A defaultdict(int) mapping group name -> total size. Groups come from
    _READELF_SIZES_METRICS, plus 'bss' (sum of all NOBITS sections) and
    'other' (sections not listed in any group).
  """
  with Unzip(apk_path, filename=lib_path) as extracted_lib_path:
    grouped_section_sizes = collections.defaultdict(int)
    no_bits_section_sizes, section_sizes = _CreateSectionNameSizeMap(
        extracted_lib_path, tool_prefix)
    for group_name, section_names in _READELF_SIZES_METRICS.items():
      for section_name in section_names:
        if section_name in section_sizes:
          # pop() so that whatever remains afterwards is "unknown".
          grouped_section_sizes[group_name] += section_sizes.pop(section_name)

    # Consider all NOBITS sections as .bss.
    grouped_section_sizes['bss'] = sum(no_bits_section_sizes.values())

    # Group any unknown section headers into the "other" group.
    for section_header, section_size in section_sizes.items():
      sys.stderr.write('Unknown elf section header: %s\n' % section_header)
      grouped_section_sizes['other'] += section_size

    # Callers iterate over the result with .items(), so it must be returned.
    return grouped_section_sizes
def _ParseManifestAttributes(apk_path):
  """Extracts a few attributes from the APK's AndroidManifest.xml.

  Runs `aapt d xmltree` on |apk_path| and searches its text output.

  Args:
    apk_path: Path to the APK to inspect.

  Returns:
    A (sdk_version, skip_extract_lib, on_demand) tuple. |sdk_version| is the
    android:minSdkVersion value parsed as hex, or None when the attribute is
    not found. The other two members are bools.
  """
  # Check if the manifest specifies whether or not to extract native libs.
  output = cmd_helper.GetCmdOutput([
      _AAPT_PATH.read(), 'd', 'xmltree', apk_path, 'AndroidManifest.xml'
  ])

  def parse_attr(name):
    # Returns the attribute's value parsed as hex, or None if it is absent.
    # Example lines being matched:
    # android:extractNativeLibs(0x010104ea)=(type 0x12)0x0
    # android:extractNativeLibs(0x010104ea)=(type 0x12)0xffffffff
    # dist:onDemand=(type 0x12)0xffffffff
    m = re.search(name + r'(?:\(.*?\))?=\(type .*?\)(\w+)', output)
    return m and int(m.group(1), 16)

  # NOTE(review): this is True when android:extractNativeLibs is non-zero,
  # which reads as the opposite of "skip extraction" - confirm the intended
  # polarity against the callers before relying on it.
  skip_extract_lib = bool(parse_attr('android:extractNativeLibs'))
  sdk_version = parse_attr('android:minSdkVersion')
  is_feature_split = parse_attr('android:isFeatureSplit')
  # Can use <dist:on-demand>, or <module dist:onDemand="true">.
  on_demand = parse_attr('dist:onDemand') or 'dist:on-demand' in output
  on_demand = bool(on_demand and is_feature_split)

  return sdk_version, skip_extract_lib, on_demand
def _NormalizeLanguagePaks(translations, factor):
  """Returns the size adjustment that normalizes locale .pak sizes.

  The zipped size of all entries in |translations| is replaced by an estimate
  derived from the en-US pak: its compressed size times the number of entries
  times |factor|.

  Args:
    translations: File group exposing FindByPattern(), GetNumEntries() and
        ComputeZippedSize().
    factor: Multiplier applied to the en-US pak's compressed size.

  Returns:
    The int delta to add to the APK size, or 0 if no en-US pak is found.
  """
  english_pak = translations.FindByPattern(r'.*/en[-_][Uu][Ss]\.l?pak')
  num_translations = translations.GetNumEntries()
  ret = 0
  if english_pak:
    ret -= translations.ComputeZippedSize()
    ret += int(english_pak.compress_size * num_translations * factor)
  return ret
def _NormalizeResourcesArsc(apk_path, num_arsc_files, num_translations,
                            out_dir):
  """Estimates the expected overhead of untranslated strings in resources.arsc.

  See http://crbug.com/677966 for why this is necessary.

  Args:
    apk_path: Path to the APK being measured.
    num_arsc_files: Number of .arsc files in the APK.
    num_translations: Number of translated locales.
    out_dir: Build output directory; only consulted when there is more than
        one .arsc file. May be None or empty.

  Returns:
    The estimated size in bytes as an int, or -inf when there are multiple
    .arsc files and no |out_dir|.

  Raises:
    Exception: If the resource-packaged .ap_ file is expected but missing.
  """
  # If there are multiple .arsc files, use the resource packaged APK instead.
  if num_arsc_files > 1:
    if not out_dir:
      return -float('inf')
    ap_name = os.path.basename(apk_path).replace('.apk', '.ap_')
    ap_path = os.path.join(out_dir, 'arsc/apks', ap_name)
    if not os.path.exists(ap_path):
      raise Exception('Missing expected file: %s, try rebuilding.' % ap_path)
    apk_path = ap_path

  aapt_output = _RunAaptDumpResources(apk_path)
  # en-rUS is in the default config and may be cluttered with non-translatable
  # strings, so en-rGB is a better baseline for finding missing translations.
  en_strings = _CreateResourceIdValueMap(aapt_output, 'en-rGB')
  fr_strings = _CreateResourceIdValueMap(aapt_output, 'fr')

  # en-US and en-GB will never be translated.
  config_count = num_translations - 2

  size = 0
  for res_id, string_val in en_strings.items():
    # A string identical in en-GB and fr is treated as untranslated.
    if string_val == fr_strings[res_id]:
      string_size = len(string_val)
      # 7 bytes is the per-entry overhead (not specific to any string). See
      # https://android.googlesource.com/platform/frameworks/base.git/+/android-4.2.2_r1/tools/aapt/StringPool.cpp#414.
      # The 1.5 factor was determined experimentally and is meant to account
      # for other languages generally having longer strings than english.
      size += config_count * (7 + string_size * 1.5)

  return int(size)
def _CreateResourceIdValueMap(aapt_output, lang):
  """Return a map of resource ids to string values for the given |lang|.

  Args:
    aapt_output: Text searched for config sections and entries.
    lang: Language/config name substituted into _AAPT_CONFIG_PATTERN.

  Returns:
    A dict built from the 'id' and 'val' groups of every _AAPT_ENTRY_RE match
    found inside each matching config section.
  """
  config_re = _AAPT_CONFIG_PATTERN % lang
  return {
      entry.group('id'): entry.group('val')
      for config_section in re.finditer(config_re, aapt_output, re.DOTALL)
      for entry in re.finditer(_AAPT_ENTRY_RE, config_section.group(0))
  }
def ComputeZippedSize(self):
  """Returns the sum of |compress_size| over all entries in this group."""
  return sum(i.compress_size for i in self._zip_infos)
def ComputeUncompressedSize(self):
  """Returns the sum of |file_size| over all entries in this group."""
  return sum(i.file_size for i in self._zip_infos)
def ComputeExtractedSize(self):
  """Returns the sum of each entry's |file_size| times its multiplier.

  |self._zip_infos| and |self._extracted_multipliers| are walked in lockstep,
  so the i-th multiplier scales the i-th entry.
  """
  ret = 0
  for zi, multiplier in zip(self._zip_infos, self._extracted_multipliers):
    ret += zi.file_size * multiplier
  return ret
# NOTE(review): This span is the tail of a function body whose `def` line and
# initial setup are not present in this file. Names such as |sdk_version|,
# |skip_extract_lib|, |report_func|, |apks_path|, |split_name|, |out_dir|,
# |tool_prefix|, |file_groups|, |zip_overhead|, |total_install_size|,
# |total_install_size_android_go|, |has_no_extension| and the file groups
# (|native_code|, |java_code|, |translations|, ...) are used below without
# being assigned here. The span sorts every zip entry into a file group,
# reports per-group sizes through |report_func|, and returns
# |normalized_apk_size|.
with zipfile.ZipFile(apk_path, 'r') as apk:
apk_contents = apk.infolist() # Account for zipalign overhead that exists in local file header.
zipalign_overhead = sum(
_ReadZipInfoExtraFieldLength(apk, i) for i in apk_contents) # Account for zipalign overhead that exists in central directory header. # Happens when python aligns entries in apkbuilder.py, but does not # exist when using Android's zipalign. E.g. for bundle .apks files.
zipalign_overhead += sum(len(i.extra) for i in apk_contents)
signing_block_size = _MeasureApkSignatureBlock(apk)
# Pre-L: Dalvik - .odex file is simply decompressed/optimized dex file (~1x). # L, M: ART - .odex file is compiled version of the dex file (~4x). # N: ART - Uses Dalvik-like JIT for normal apps (~1x), full compilation for # shared apps (~4x). # Actual multipliers calculated using "apk_operations.py disk-usage". # Will need to update multipliers once apk obfuscation is enabled. # E.g. with obfuscation, the 4.04 changes to 4.46.
speed_profile_dex_multiplier = 1.17
orig_filename = apks_path or apk_path
is_webview = 'WebView'in orig_filename
is_monochrome = 'Monochrome'in orig_filename
is_library = 'Library'in orig_filename
is_shared_apk = sdk_version >= 24 and (is_monochrome or is_webview or is_library) # Dex decompression overhead varies by Android version. if sdk_version < 21: # JellyBean & KitKat
dex_multiplier = 1.16 elif sdk_version < 24: # Lollipop & Marshmallow
dex_multiplier = 4.04 elif is_shared_apk: # Oreo and above, compilation_filter=speed
dex_multiplier = 4.04 else: # Oreo and above, compilation_filter=speed-profile
dex_multiplier = speed_profile_dex_multiplier
total_apk_size = os.path.getsize(apk_path) for member in apk_contents:
filename = member.filename if filename.endswith('/'): continue if filename.endswith('.so'):
basename = posixpath.basename(filename)
should_extract_lib = not skip_extract_lib and basename.startswith('lib')
native_code.AddZipInfo(
member, extracted_multiplier=int(should_extract_lib)) elif filename.endswith('.dex'):
java_code.AddZipInfo(member, extracted_multiplier=dex_multiplier) elif re.search(_RE_NON_LANGUAGE_PAK, filename):
native_resources_no_translations.AddZipInfo(member) elif filename.endswith('.pak') or filename.endswith('.lpak'):
compressed = member.compress_type != zipfile.ZIP_STORED
bucket = translations if compressed else stored_translations
extracted_multiplier = 0 if compressed:
extracted_multiplier = int('en_'in filename or'en-'in filename)
bucket.AddZipInfo(member, extracted_multiplier=extracted_multiplier) elif'icu'in filename and filename.endswith('.dat'):
icu_data.AddZipInfo(member) elif filename.endswith('.bin'):
v8_snapshots.AddZipInfo(member) elif filename.startswith('res/'): if (filename.endswith('.png') or filename.endswith('.webp') or has_no_extension(filename)):
png_drawables.AddZipInfo(member) else:
res_directory.AddZipInfo(member) elif filename.endswith('.arsc'):
arsc.AddZipInfo(member) elif filename.startswith('META-INF') or filename in ( 'AndroidManifest.xml', 'assets/webapk_dex_version.txt'):
metadata.AddZipInfo(member) elif filename.endswith('.notice'):
notices.AddZipInfo(member) elif filename.startswith('assets/unwind_cfi'):
unwind_cfi.AddZipInfo(member) else:
unknown.AddZipInfo(member)
if apks_path: # We're mostly focused on size of Chrome for non-English locales, so assume # Hindi (arbitrarily chosen) locale split is installed. with zipfile.ZipFile(apks_path) as z:
subpath = 'splits/{}-hi.apk'.format(split_name) if subpath in z.namelist():
hindi_apk_info = z.getinfo(subpath)
total_apk_size += hindi_apk_info.file_size else: assert split_name != 'base', 'splits/base-hi.apk should always exist'
for group in file_groups:
actual_size = group.ComputeZippedSize()
install_size = group.ComputeInstallSize()
uncompressed_size = group.ComputeUncompressedSize()
extracted_size = group.ComputeExtractedSize()
total_install_size += extracted_size
zip_overhead -= actual_size
report_func('Breakdown', group.name + ' size', actual_size, 'bytes')
report_func('InstallBreakdown', group.name + ' size', int(install_size), 'bytes') # Only a few metrics are compressed in the first place. # To avoid over-reporting, track uncompressed size only for compressed # entries. if uncompressed_size != actual_size:
report_func('Uncompressed', group.name + ' size', uncompressed_size, 'bytes')
if group is java_code and is_shared_apk: # Updates are compiled using quicken, but system image uses speed-profile.
extracted_size = int(uncompressed_size * speed_profile_dex_multiplier)
total_install_size_android_go += extracted_size
report_func('InstallBreakdownGo', group.name + ' size',
actual_size + extracted_size, 'bytes') elif group is translations and apks_path: # Assume Hindi rather than English (accounted for above in total_apk_size)
total_install_size_android_go += actual_size else:
total_install_size_android_go += extracted_size
# Size of main dex vs remaining.
main_dex_info = java_code.FindByPattern('classes.dex') if main_dex_info:
main_dex_size = main_dex_info.file_size
report_func('Specifics', 'main dex size', main_dex_size, 'bytes')
secondary_size = java_code.ComputeUncompressedSize() - main_dex_size
report_func('Specifics', 'secondary dex size', secondary_size, 'bytes')
main_lib_info = native_code.FindLargest()
native_code_unaligned_size = 0 for lib_info in native_code.AllEntries():
section_sizes = _ExtractLibSectionSizesFromApk(apk_path, lib_info.filename,
tool_prefix)
native_code_unaligned_size += sum(v for k, v in section_sizes.items() if k != 'bss') # Size of main .so vs remaining. if lib_info == main_lib_info:
main_lib_size = lib_info.file_size
report_func('Specifics', 'main lib size', main_lib_size, 'bytes')
secondary_size = native_code.ComputeUncompressedSize() - main_lib_size
report_func('Specifics', 'other lib size', secondary_size, 'bytes')
for metric_name, size in section_sizes.items():
report_func('MainLibInfo', metric_name, size, 'bytes')
# Main metric that we want to monitor for jumps.
normalized_apk_size = total_apk_size # unwind_cfi exists only in dev, canary, and non-channel builds.
normalized_apk_size -= unwind_cfi.ComputeZippedSize() # Sections within .so files get 4kb aligned, so use section sizes rather than # file size. Also gets rid of compression.
normalized_apk_size -= native_code.ComputeZippedSize()
normalized_apk_size += native_code_unaligned_size # Normalized dex size: Size within the zip + size on disk for Android Go # devices running Android O (which ~= uncompressed dex size). # Use a constant compression factor to account for fluctuations.
normalized_apk_size -= java_code.ComputeZippedSize()
normalized_apk_size += java_code.ComputeUncompressedSize() # Don't include zipalign overhead in normalized size, since it effectively # causes size changes to files that precede aligned files to be rounded. # For APKs where classes.dex directly precedes libchrome.so (the normal case), # this causes small dex size changes to disappear into libchrome.so alignment.
normalized_apk_size -= zipalign_overhead # Don't include the size of the apk's signing block because it can fluctuate # by up to 4kb (from my non-scientific observations), presumably based on hash # sizes.
normalized_apk_size -= signing_block_size
# Unaligned size should be ~= uncompressed size or something is wrong. # As of now, padding_fraction ~= .007
padding_fraction = -_PercentageDifference(
native_code.ComputeUncompressedSize(), native_code_unaligned_size) # Ignore this check for small / no native code if native_code.ComputeUncompressedSize() > 1000000: assert 0 <= padding_fraction < .02, ( 'Padding was: {} (file_size={}, sections_sum={})'.format(
padding_fraction, native_code.ComputeUncompressedSize(),
native_code_unaligned_size))
if apks_path: # Locale normalization not needed when measuring only one locale. # E.g. a change that adds 300 chars of untranslated strings would cause the # metric to be off by only 390 bytes (assuming a multiplier of 2.3 for # Hindi). pass else: # Avoid noise caused when strings change and translations haven't yet been # updated.
num_translations = translations.GetNumEntries()
num_stored_translations = stored_translations.GetNumEntries()
if num_translations > 1: # Multipliers found by looking at MonochromePublic.apk and seeing how much # smaller en-US.pak is relative to the average locale.pak.
normalized_apk_size += _NormalizeLanguagePaks(translations, 1.17) if num_stored_translations > 1:
normalized_apk_size += _NormalizeLanguagePaks(stored_translations, 1.43) if num_translations + num_stored_translations > 1: if num_translations == 0: # WebView stores all locale paks uncompressed.
num_arsc_translations = num_stored_translations else: # Monochrome has more configurations than Chrome since it includes # WebView (which supports more locales), but these should mostly be # empty so ignore them here.
num_arsc_translations = num_translations
normalized_apk_size += _NormalizeResourcesArsc(apk_path,
arsc.GetNumEntries(),
num_arsc_translations,
out_dir)
# It will be -Inf for .apk files with multiple .arsc files and no out_dir set. if normalized_apk_size < 0:
sys.stderr.write('Skipping normalized_apk_size (no output directory set)\n') else:
report_func('Specifics', 'normalized apk size', normalized_apk_size, 'bytes') # The "file count" metric cannot be grouped with any other metrics when the # end result is going to be uploaded to the perf dashboard in the HistogramSet # format due to mixed units (bytes vs. zip entries) causing malformed # summaries to be generated. # TODO(https://crbug.com/903970): Remove this workaround if unit mixing is # ever supported.
report_func('FileCount', 'file count', len(apk_contents), 'zip entries')
for info in unknown.AllEntries():
sys.stderr.write( 'Unknown entry: %s %d\n' % (info.filename, info.compress_size)) return normalized_apk_size
def _CalculateCompressedSize(file_path):
  """Returns the zlib-compressed size of the file at |file_path|, in bytes.

  The file is streamed through a single compressor in fixed-size chunks so
  that it never has to be held in memory in full.
  """
  CHUNK_SIZE = 256 * 1024
  compressor = zlib.compressobj()
  total_size = 0
  with open(file_path, 'rb') as f:
    # iter() with a sentinel stops at the first empty read (end of file).
    for chunk in iter(lambda: f.read(CHUNK_SIZE), b''):
      total_size += len(compressor.compress(chunk))
  # flush() emits whatever the compressor is still buffering.
  total_size += len(compressor.flush())
  return total_size
@contextmanager
def Unzip(zip_file, filename=None):
  """Utility for temporary use of a single file in a zip archive.

  Args:
    zip_file: Path to the zip archive.
    filename: Passed to build_utils.ExtractAll as |pattern| to select what to
        extract.

  Yields:
    Path of the first extracted file, located inside a temporary directory
    that only exists for the duration of the `with` block.

  Raises:
    Exception: If nothing was extracted.
  """
  with build_utils.TempDir() as unzipped_dir:
    unzipped_files = build_utils.ExtractAll(
        zip_file, unzipped_dir, True, pattern=filename)
    if len(unzipped_files) == 0:
      raise Exception('%s not found in %s' % (filename, zip_file))
    yield unzipped_files[0]
def _AnalyzeApkOrApks(report_func, apk_path, args):
  """Analyzes a .apk or .apks file and reports its dex statistics.

  Args:
    report_func: Callable invoked as
        report_func(graph_title, trace_title, value, units).
    apk_path: Path to a .apk or .apks file.
    args: Parsed command-line arguments; |args.out_dir| is read here.

  Returns:
    The method_count.DexStatsCollector created for this input.

  Raises:
    Exception: If |apk_path| ends with neither '.apk' nor '.apks'.
  """
  # Create DexStatsCollector here to track unique methods across base & chrome
  # modules.
  dex_stats_collector = method_count.DexStatsCollector()
  out_dir, tool_prefix = _ConfigOutDirAndToolsPrefix(args.out_dir)

  if apk_path.endswith('.apk'):
    sdk_version, _, _ = _ParseManifestAttributes(apk_path)
    _AnalyzeInternal(apk_path, sdk_version, report_func, dex_stats_collector,
                     out_dir, tool_prefix)
  elif apk_path.endswith('.apks'):
    # NOTE(review): as written, this branch only determines |sdk_version| from
    # the base split; no _AnalyzeInternal() call is present for .apks inputs -
    # confirm nothing was lost here.
    with tempfile.NamedTemporaryFile(suffix='.apk') as f:
      with zipfile.ZipFile(apk_path) as z:
        # Currently bundletool is creating two apks when .apks is created
        # without specifying an sdkVersion. Always measure the one with an
        # uncompressed shared library.
        try:
          info = z.getinfo('splits/base-master_2.apk')
        except KeyError:
          info = z.getinfo('splits/base-master.apk')
        _ExtractToTempFile(z, info.filename, f)
        sdk_version, _, _ = _ParseManifestAttributes(f.name)
  else:
    # Without this, |sdk_version| would be unbound below and the failure
    # would surface as a confusing UnboundLocalError.
    raise Exception('Unknown file type: ' + apk_path)

  # Report dex stats outside of _AnalyzeInternal() so that the "unique methods"
  # metric is not just the sum of the base and chrome modules.
  for metric, count in dex_stats_collector.GetTotalCounts().items():
    report_func('Dex', metric, count, 'entries')
  report_func('Dex', 'unique methods',
              dex_stats_collector.GetUniqueMethodCount(), 'entries')
  report_func('DexCache', 'DexCache',
              dex_stats_collector.GetDexCacheSize(pre_oreo=sdk_version < 26),
              'bytes')

  return dex_stats_collector
def _ResourceSizes(args):
  """Measures the input(s) named by |args| and optionally writes histograms.

  When any --trichrome-* path is given, each one is analyzed with its own
  trace-title prefix and combined totals are synthesized; otherwise
  |args.input| is analyzed on its own.

  Args:
    args: Parsed command-line arguments.

  Raises:
    Exception: If converting chartjson to histograms fails.
  """
  chartjson = _BASE_CHART.copy() if args.output_format else None
  reporter = _ChartJsonReporter(chartjson)
  # Create DexStatsCollector here to track unique methods across trichrome APKs.
  dex_stats_collector = method_count.DexStatsCollector()

  specs = [
      ('Chrome_', args.trichrome_chrome),
      ('WebView_', args.trichrome_webview),
      ('Library_', args.trichrome_library),
  ]
  for prefix, path in specs:
    if path:
      reporter.trace_title_prefix = prefix
      child_dex_stats_collector = _AnalyzeApkOrApks(reporter, path, args)
      dex_stats_collector.MergeFrom(prefix, child_dex_stats_collector)

  if any(path for _, path in specs):
    reporter.SynthesizeTotals(dex_stats_collector.GetUniqueMethodCount())
  else:
    _AnalyzeApkOrApks(reporter, args.input, args)

  # We would ideally generate a histogram set directly instead of generating
  # chartjson then converting. However, perf_tests_results_helper is in
  # //build, which doesn't seem to have any precedent for depending on
  # anything in Catapult. This can probably be fixed, but since this doesn't
  # need to be super fast or anything, converting is a good enough solution
  # for the time being.
  if args.output_format == 'histograms':
    # NOTE(review): |results_path| is not assigned anywhere in this function
    # as written - confirm where the chartjson file is dumped.
    histogram_result = convert_chart_json.ConvertChartJson(results_path)
    if histogram_result.returncode != 0:
      raise Exception('chartjson conversion failed with error: ' +
                      histogram_result.stdout)

    histogram_path = os.path.join(args.output_dir, 'perf_results.json')
    logging.critical('Dumping histograms to %s', histogram_path)
    with open(histogram_path, 'w') as json_file:
      json_file.write(histogram_result.stdout)
def main():
  """Sets up logging and parses the command-line arguments."""
  build_utils.InitLogging('RESOURCE_SIZES_DEBUG')
  argparser = argparse.ArgumentParser(description='Print APK size metrics.')
  argparser.add_argument(
      '--min-pak-resource-size',
      type=int,
      default=20 * 1024,
      help='Minimum byte size of displayed pak resources.')
  argparser.add_argument(
      '--chromium-output-directory',
      dest='out_dir',
      type=os.path.realpath,
      help='Location of the build artifacts.')
  argparser.add_argument(
      '--chartjson',
      action='store_true',
      help='DEPRECATED. Use --output-format=chartjson '
      'instead.')
  argparser.add_argument(
      '--output-format',
      choices=['chartjson', 'histograms'],
      help='Output the results to a file in the given '
      'format instead of printing the results.')
  argparser.add_argument('--loadable_module', help='Obsolete (ignored).')

  # Accepted to conform to the isolated script interface, but ignored.
  argparser.add_argument(
      '--isolated-script-test-filter', help=argparse.SUPPRESS)
  argparser.add_argument(
      '--isolated-script-test-perf-output',
      type=os.path.realpath,
      help=argparse.SUPPRESS)

  # NOTE(review): |output_group| is not assigned anywhere in this function as
  # written - confirm how the group is meant to be created.
  output_group.add_argument(
      '--output-dir', default='.', help='Directory to save chartjson to.')
  output_group.add_argument(
      '--output-file',
      help='Path to output .json (replaces --output-dir). Works only for '
      '--output-format=chartjson')
  output_group.add_argument(
      '--isolated-script-test-output',
      type=os.path.realpath,
      help='File to which results will be written in the '
      'simplified JSON output format.')

  argparser.add_argument('input', help='Path to .apk or .apks file to measure.')
  trichrome_group = argparser.add_argument_group(
      'Trichrome inputs',
      description='When specified, |input| is used only as Test suite name.')
  trichrome_group.add_argument(
      '--trichrome-chrome', help='Path to Trichrome Chrome .apks')
  trichrome_group.add_argument(
      '--trichrome-webview', help='Path to Trichrome WebView .apk(s)')
  trichrome_group.add_argument(
      '--trichrome-library', help='Path to Trichrome Library .apk')
  args = argparser.parse_args()
# NOTE: The remaining text is a website footer, not part of the program.
# Translated from German:
# The information on this website has been carefully compiled to the best of
# our knowledge. However, neither the completeness, nor the correctness, nor
# the quality of the information provided is guaranteed.
# Remark:
# The syntax highlighting and the measurement are still experimental.