tools/makeqstrdefs.py: Run qstr preprocessing in parallel.

This gives a substantial speedup of the preprocessing step, i.e. the
generation of qstr.i.last.  For example on a clean build, making
qstr.i.last:

    21s -> 4s on STM32 (WB55)
    8.9 -> 1.8s on Unix (dev).

Done in collaboration with @stinos.

Signed-off-by: Jim Mussared <jim.mussared@gmail.com>
This commit is contained in:
Jim Mussared 2020-10-29 16:38:13 +11:00 committed by Damien George
parent d7e1526593
commit a7932ae4e6
1 changed files with 24 additions and 7 deletions

View File

@ -7,11 +7,12 @@ This script works with Python 2.6, 2.7, 3.3 and 3.4.
from __future__ import print_function from __future__ import print_function
import io
import os
import re import re
import subprocess import subprocess
import sys import sys
import io import multiprocessing, multiprocessing.dummy
import os
# Extract MP_QSTR_FOO macros. # Extract MP_QSTR_FOO macros.
@ -39,11 +40,27 @@ def preprocess():
os.makedirs(os.path.dirname(args.output[0])) os.makedirs(os.path.dirname(args.output[0]))
except OSError: except OSError:
pass pass
with open(args.output[0], "w") as out_file:
if csources: def pp(flags):
subprocess.check_call(args.pp + args.cflags + csources, stdout=out_file) def run(files):
if cxxsources: return subprocess.check_output(args.pp + flags + files)
subprocess.check_call(args.pp + args.cxxflags + cxxsources, stdout=out_file)
return run
try:
cpus = multiprocessing.cpu_count()
except NotImplementedError:
cpus = 1
p = multiprocessing.dummy.Pool(cpus)
with open(args.output[0], "wb") as out_file:
for flags, sources in (
(args.cflags, csources),
(args.cxxflags, cxxsources),
):
batch_size = (len(sources) + cpus - 1) // cpus
chunks = [sources[i : i + batch_size] for i in range(0, len(sources), batch_size or 1)]
for output in p.imap(pp(flags), chunks):
out_file.write(output)
def write_out(fname, output): def write_out(fname, output):