Timestamps in pyc files and zip archives were causing cache misses in RBE. Bug: b/322788229 Test: Ran a few local builds and verified improved cache hit rate for metalava actions. Change-Id: I9375694d26a107f5c0c43bbd685bd8e86349d187
72 lines
2.7 KiB
Python
72 lines
2.7 KiB
Python
#!/usr/bin/env python3
|
|
# Copyright 2023 Google Inc. All rights reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
import argparse
|
|
import py_compile
|
|
import os
|
|
import sys
|
|
import shutil
|
|
import tempfile
|
|
import zipfile
|
|
|
|
# This file needs to support both python 2 and 3.
|
|
|
|
|
|
def process_one_file(info, infile, outzip):
|
|
if not info.filename.endswith('.py'):
|
|
outzip.writestr(info, infile.read())
|
|
return
|
|
|
|
# Unfortunately py_compile requires the input/output files to be written
|
|
# out to disk.
|
|
with tempfile.NamedTemporaryFile(prefix="Soong_precompile_", delete=False) as tmp:
|
|
shutil.copyfileobj(infile, tmp)
|
|
in_name = tmp.name
|
|
with tempfile.NamedTemporaryFile(prefix="Soong_precompile_", delete=False) as tmp:
|
|
out_name = tmp.name
|
|
try:
|
|
# Ensure deterministic pyc by using the hash rather than timestamp.
|
|
# This is required to improve caching in accelerated builds.
|
|
# Only works on Python 3.7+ (see https://docs.python.org/3/library/py_compile.html#py_compile.PycInvalidationMode)
|
|
# which should cover most updated branches and developer machines.
|
|
if sys.version_info >= (3, 7):
|
|
py_compile.compile(in_name, out_name, info.filename, doraise=True, invalidation_mode=py_compile.PycInvalidationMode.CHECKED_HASH)
|
|
else:
|
|
py_compile.compile(in_name, out_name, info.filename, doraise=True)
|
|
with open(out_name, 'rb') as f:
|
|
info.filename = info.filename + 'c'
|
|
# Use ZipInfo rather than str to reuse timestamps for deterministic zip files.
|
|
outzip.writestr(info, f.read())
|
|
finally:
|
|
os.remove(in_name)
|
|
os.remove(out_name)
|
|
|
|
|
|
def main():
|
|
parser = argparse.ArgumentParser()
|
|
parser.add_argument('src_zip')
|
|
parser.add_argument('dst_zip')
|
|
args = parser.parse_args()
|
|
|
|
with open(args.dst_zip, 'wb') as outf, open(args.src_zip, 'rb') as inf:
|
|
with zipfile.ZipFile(outf, mode='w') as outzip, zipfile.ZipFile(inf, mode='r') as inzip:
|
|
for info in inzip.infolist():
|
|
with inzip.open(info.filename, mode='r') as inzipf:
|
|
process_one_file(info, inzipf, outzip)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
main()
|