ICU-10923 Adding unix-exec mode to buildtool and updating help page.

author Shane Carr <shane@unicode.org>

Wed, 23 Jan 2019 08:26:31 +0000 (00:26 -0800)

committer Shane F. Carr <shane@unicode.org>

Fri, 25 Jan 2019 23:34:44 +0000 (15:34 -0800)
author Shane Carr <shane@unicode.org>
Wed, 23 Jan 2019 08:26:31 +0000 (00:26 -0800)
committer Shane F. Carr <shane@unicode.org>
Fri, 25 Jan 2019 23:34:44 +0000 (15:34 -0800)
diff --git a/icu4c/source/configure b/icu4c/source/configure

index 659832e2491558f3259ee8e10ae162d0fc7c05b2..29bcec408d5d8a37c76e8a73280f185429a17cd6 100755 (executable)
--- a/icu4c/source/configure
+++ b/icu4c/source/configure
@@ -9128,16 +9128,16 @@ then
  else
      echo "Spawning Python to generate data/rules.mk..."
      PYTHONPATH="$srcdir/data" $PYTHON -m buildtool \
-        --format gnumake \
+        --mode gnumake \
          --seqmode parallel \
-        --glob_dir "$srcdir/data" \
+        --in_dir "$srcdir/data" \
          --filter_file "$ICU_DATA_FILTER_FILE" \
          > data/rules.mk
      echo "Spawning Python to generate test/testdata/rules.mk..."
      PYTHONPATH="$srcdir/test/testdata:$srcdir/data" $PYTHON -m buildtool \
-        --format gnumake \
+        --mode gnumake \
          --seqmode parallel \
-        --glob_dir "$srcdir/test/testdata" \
+        --in_dir "$srcdir/test/testdata" \
          > test/testdata/rules.mk
  fi
  
diff --git a/icu4c/source/configure.ac b/icu4c/source/configure.ac

index 80da9255f591f2d4589068cc5e659f33c223d062..b2f8446a054f74f42ce4ae2d2202b9d9a35c1edc 100644 (file)
--- a/icu4c/source/configure.ac
+++ b/icu4c/source/configure.ac
@@ -1392,16 +1392,16 @@ then
  else
      echo "Spawning Python to generate data/rules.mk..."
      PYTHONPATH="$srcdir/data" $PYTHON -m buildtool \
-        --format gnumake \
+        --mode gnumake \
          --seqmode parallel \
-        --glob_dir "$srcdir/data" \
+        --in_dir "$srcdir/data" \
          --filter_file "$ICU_DATA_FILTER_FILE" \
          > data/rules.mk
      echo "Spawning Python to generate test/testdata/rules.mk..."
      PYTHONPATH="$srcdir/test/testdata:$srcdir/data" $PYTHON -m buildtool \
-        --format gnumake \
+        --mode gnumake \
          --seqmode parallel \
-        --glob_dir "$srcdir/test/testdata" \
+        --in_dir "$srcdir/test/testdata" \
          > test/testdata/rules.mk
  fi
  
diff --git a/icu4c/source/data/BUILDRULES.py b/icu4c/source/data/BUILDRULES.py

index f305bd589a72fcec2194630eca80cdd1b940dfad..0ba6ddb7ea95cba76bd2a9011a711fcc960f365e 100644 (file)
--- a/icu4c/source/data/BUILDRULES.py
+++ b/icu4c/source/data/BUILDRULES.py
@@ -18,7 +18,7 @@ def generate(config, glob, common_vars):
      requests = []
  
      if len(glob("misc/*")) == 0:
-        print("Error: Cannot find data directory; please specify --glob_dir", file=sys.stderr)
+        print("Error: Cannot find data directory; please specify --in_dir", file=sys.stderr)
          exit(1)
  
      requests += generate_cnvalias(config, glob, common_vars)
diff --git a/icu4c/source/data/buildtool/__main__.py b/icu4c/source/data/buildtool/__main__.py

index 7ef4d981bc977e37a603255d2892b2ed97e53106..f30e6ff7593dfa278d8e1d4435ae23491216c60b 100644 (file)
--- a/icu4c/source/data/buildtool/__main__.py
+++ b/icu4c/source/data/buildtool/__main__.py
@@ -13,7 +13,7 @@ import sys
  
  from . import *
  from .comment_stripper import CommentStripper
-from .renderers import makefile, windirect
+from .renderers import makefile, unix_exec, windows_exec
  from . import filtration, utils
  import BUILDRULES
  
@@ -21,93 +21,102 @@ flag_parser = argparse.ArgumentParser(
      description = """Generates rules for building ICU binary data files from text
  and other input files in source control.
  
-You can select features using either the --whitelist or --blacklist option.
-Available features include:
+Use the --mode option to declare how to execute those rules, either exporting
+the rules to a Makefile or spawning child processes to run them immediately:
  
-{AVAILABLE_FEATURES}
-""".format(AVAILABLE_FEATURES = "\n".join("    %s" % v for v in AVAILABLE_FEATURES)),
+  --mode=gnumake prints a Makefile to standard out.
+  --mode=unix-exec spawns child processes in a Unix-like environment.
+  --mode=windows-exec spawns child processes in a Windows-like environment.
+
+Tips for --mode=unix-exec
+=========================
+
+Create two empty directories for out_dir and tmp_dir. They will get filled
+with a lot of intermediate files.
+
+Set LD_LIBRARY_PATH to include the lib directory. e.g., from icu4c/source:
+
+  $ LD_LIBRARY_PATH=lib PYTHONPATH=data python3 -m buildtool ...
+
+Once buildtool finishes, you have compiled the data, but you have not packaged
+it into a .dat or .so file. This is done by the separate pkgdata tool in bin.
+Read the docs of pkgdata:
+
+  $ LD_LIBRARY_PATH=lib ./bin/pkgdata --help
+
+Example command line to call pkgdata:
+
+  $ LD_LIBRARY_PATH=lib ./bin/pkgdata -m common -p icudt63l -c \\
+      -O data/icupkg.inc -s $OUTDIR -d $TMPDIR $TMPDIR/icudata.lst
+
+where $OUTDIR and $TMPDIR are your out and tmp directories, respectively.
+The above command will create icudt63l.dat in the tmpdir.
+
+Command-Line Arguments
+======================
+""",
      formatter_class = argparse.RawDescriptionHelpFormatter
  )
-flag_parser.add_argument(
-    "--format",
-    help = "How to output the rules to run to build ICU data.",
-    choices = ["gnumake", "windirect"],
+
+arg_group_required = flag_parser.add_argument_group("required arguments")
+arg_group_required.add_argument(
+    "--mode",
+    help = "What to do with the generated rules.",
+    choices = ["gnumake", "unix-exec", "windows-exec"],
      required = True
  )
+
  flag_parser.add_argument(
-    "--glob_dir",
-    help = "Path to data input folder (icu4c/source/data) when this script is being run.",
+    "--in_dir",
+    help = "Path to data input folder (icu4c/source/data).",
      default = "."
  )
  flag_parser.add_argument(
-    "--in_dir",
-    help = "Path to data input folder (icu4c/source/data) for file processing. Not used in gnumake format.",
-    default = "."
+    "--filter_file",
+    metavar = "PATH",
+    help = "Path to an ICU data filter JSON file.",
+    default = None
  )
  flag_parser.add_argument(
+    "--collation_ucadata",
+    help = "Which data set to use for ucadata in collation.",
+    choices = ["unihan", "implicithan"],
+    default = "unihan"
+)
+flag_parser.add_argument(
+    "--seqmode",
+    help = "Whether to optimize rules to be run sequentially (fewer threads) or in parallel (many threads). Defaults to 'sequential', which is better for unix-exec and windows-exec modes. 'parallel' is often better for massively parallel build systems.",
+    choices = ["sequential", "parallel"],
+    default = "sequential"
+)
+
+arg_group_exec = flag_parser.add_argument_group("arguments for unix-exec and windows-exec modes")
+arg_group_exec.add_argument(
      "--out_dir",
-    help = "Path to where to save output data files. Not used in gnumake format.",
+    help = "Path to where to save output data files.",
      default = "icudata"
  )
-flag_parser.add_argument(
+arg_group_exec.add_argument(
      "--tmp_dir",
-    help = "Path to where to save temporary files. Not used in gnumake format.",
+    help = "Path to where to save temporary files.",
      default = "icutmp"
  )
-flag_parser.add_argument(
+arg_group_exec.add_argument(
      "--tool_dir",
-    help = "Path to where to find binary tools (genrb, genbrk, etc). Used for 'windirect' format only.",
-    default = "../tool"
+    help = "Path to where to find binary tools (genrb, etc).",
+    default = "../bin"
  )
-flag_parser.add_argument(
+arg_group_exec.add_argument(
      "--tool_cfg",
-    help = "The build configuration of the tools. Used for 'windirect' format only.",
+    help = "The build configuration of the tools. Used in 'windows-exec' mode only.",
      default = "x86/Debug"
  )
-flag_parser.add_argument(
-    "--seqmode",
-    help = "Whether to optimize rules to be run sequentially (fewer threads) or in parallel (many threads).",
-    choices = ["sequential", "parallel"],
-    default = "parallel"
-)
-flag_parser.add_argument(
-    "--collation_ucadata",
-    help = "Which data set to use for ucadata in collation.",
-    choices = ["unihan", "implicithan"],
-    default = "unihan"
-)
-features_group = flag_parser.add_mutually_exclusive_group()
-features_group.add_argument(
-    "--blacklist",
-    metavar = "FEATURE",
-    help = "A list of one or more features to disable; all others will be enabled by default. New users should favor a blacklist to ensure important data is not left out.",
-    nargs = "+",
-    choices = AVAILABLE_FEATURES
-)
-features_group.add_argument(
-    "--whitelist",
-    metavar = "FEATURE",
-    help = "A list of one or more features to enable; all others will be disabled by default.",
-    nargs = "+",
-    choices = AVAILABLE_FEATURES
-)
-features_group.add_argument(
-    "--filter_file",
-    help = "A path to a filter file.",
-    default = None
-)
  
  
  class Config(object):
  
      def __init__(self, args):
          # Process arguments
-        if args.whitelist:
-            self._feature_set = set(args.whitelist)
-        elif args.blacklist:
-            self._feature_set = set(AVAILABLE_FEATURES) - set(args.blacklist)
-        else:
-            self._feature_set = set(AVAILABLE_FEATURES)
          self.max_parallel = (args.seqmode == "parallel")
          # Either "unihan" or "implicithan"
          self.coll_han_type = args.collation_ucadata
@@ -152,16 +161,12 @@ class Config(object):
          except ImportError:
              pass
  
-    def has_feature(self, feature_name):
-        assert feature_name in AVAILABLE_FEATURES
-        return feature_name in self._feature_set
-
  
  def main():
      args = flag_parser.parse_args()
      config = Config(args)
  
-    if args.format == "gnumake":
+    if args.mode == "gnumake":
          makefile_vars = {
              "IN_DIR": "$(srcdir)",
              "INDEX_NAME": "res_index"
@@ -171,10 +176,12 @@ def main():
              key: "$(%s)" % key
              for key in list(makefile_vars.keys()) + makefile_env
          }
-        common["GLOB_DIR"] = args.glob_dir
+        common["GLOB_DIR"] = args.in_dir
      else:
          common = {
-            "GLOB_DIR": args.glob_dir,
+            # GLOB_DIR is used now, whereas IN_DIR is used during execution phase.
+            # There is no useful distinction in unix-exec or windows-exec mode.
+            "GLOB_DIR": args.in_dir,
              "IN_DIR": args.in_dir,
              "OUT_DIR": args.out_dir,
              "TMP_DIR": args.tmp_dir,
@@ -185,11 +192,11 @@ def main():
  
      def glob(pattern):
          result_paths = pyglob.glob("{IN_DIR}/{PATTERN}".format(
-            IN_DIR = args.glob_dir,
+            IN_DIR = args.in_dir,
              PATTERN = pattern
          ))
          # For the purposes of buildtool, force Unix-style directory separators.
-        return [v.replace("\\", "/")[len(args.glob_dir)+1:] for v in sorted(result_paths)]
+        return [v.replace("\\", "/")[len(args.in_dir)+1:] for v in sorted(result_paths)]
  
      requests = BUILDRULES.generate(config, glob, common)
      requests = filtration.apply_filters(requests, config)
@@ -197,23 +204,30 @@ def main():
  
      build_dirs = utils.compute_directories(requests)
  
-    if args.format == "gnumake":
+    if args.mode == "gnumake":
          print(makefile.get_gnumake_rules(
              build_dirs,
              requests,
              makefile_vars,
              common_vars = common
          ))
-    elif args.format == "windirect":
-        return windirect.run(
-            build_dirs,
-            requests,
+    elif args.mode == "windows-exec":
+        return windows_exec.run(
+            build_dirs = build_dirs,
+            requests = requests,
              common_vars = common,
              tool_dir = args.tool_dir,
              tool_cfg = args.tool_cfg
          )
+    elif args.mode == "unix-exec":
+        return unix_exec.run(
+            build_dirs = build_dirs,
+            requests = requests,
+            common_vars = common,
+            tool_dir = args.tool_dir
+        )
      else:
-        print("Format not supported: %s" % args.format)
+        print("Mode not supported: %s" % args.mode)
          return 1
      return 0
  
diff --git a/icu4c/source/data/buildtool/renderers/windirect.py b/icu4c/source/data/buildtool/renderers/common_exec.py

similarity index 68%

rename from icu4c/source/data/buildtool/renderers/windirect.py

rename to icu4c/source/data/buildtool/renderers/common_exec.py

index 99911519072c3d467d7dafe5d61f48a746103cc2..803d416296986758866361ffdf904c0ccac87222 100644 (file)
--- a/icu4c/source/data/buildtool/renderers/windirect.py
+++ b/icu4c/source/data/buildtool/renderers/common_exec.py
@@ -18,10 +18,10 @@ def run(build_dirs, requests, common_vars, **kwargs):
          if status != 0:
              print("!!! ERROR executing above command line: exit code %d" % status)
              return 1
-    print("windirect: All data build commands executed")
+    print("All data build commands executed")
      return 0
  
-def run_helper(request, common_vars, tool_dir, tool_cfg, **kwargs):
+def run_helper(request, common_vars, is_windows, tool_dir, tool_cfg=None, **kwargs):
      if isinstance(request, PrintFileRequest):
          output_path = "{DIRNAME}/{FILENAME}".format(
              DIRNAME = utils.dir_for(request.output_file).format(**common_vars),
@@ -48,12 +48,20 @@ def run_helper(request, common_vars, tool_dir, tool_cfg, **kwargs):
          return 0
  
      assert isinstance(request.tool, IcuTool)
-    cmd_template = "{TOOL_DIR}/{TOOL}/{TOOL_CFG}/{TOOL}.exe {{ARGS}}".format(
-        TOOL_DIR = tool_dir,
-        TOOL_CFG = tool_cfg,
-        TOOL = request.tool.name,
-        **common_vars
-    )
+    if is_windows:
+        cmd_template = "{TOOL_DIR}/{TOOL}/{TOOL_CFG}/{TOOL}.exe {{ARGS}}".format(
+            TOOL_DIR = tool_dir,
+            TOOL_CFG = tool_cfg,
+            TOOL = request.tool.name,
+            **common_vars
+        )
+    else:
+        cmd_template = "{TOOL_DIR}/{TOOL} {{ARGS}}".format(
+            TOOL_DIR = tool_dir,
+            TOOL = request.tool.name,
+            **common_vars
+        )
+
      if isinstance(request, RepeatedExecutionRequest):
          for loop_vars in utils.repeated_execution_request_looper(request):
              command_line = utils.format_repeated_request_command(
@@ -62,18 +70,24 @@ def run_helper(request, common_vars, tool_dir, tool_cfg, **kwargs):
                  loop_vars,
                  common_vars
              )
-            # TODO: Is this / to \ substitution too aggressive?
-            command_line = command_line.replace("/", "\\")
+            if is_windows:
+                # Note: this / to \ substitution may be too aggressive?
+                command_line = command_line.replace("/", "\\")
              print("Running: %s" % command_line)
-            res = subprocess.run(command_line)
+            res = subprocess.run(command_line, shell=True)
              if res.returncode != 0:
                  return res.returncode
          return 0
      if isinstance(request, SingleExecutionRequest):
-        command_line = utils.format_single_request_command(request, cmd_template, common_vars)
-        # TODO: Is this / to \ substitution too aggressive?
-        command_line = command_line.replace("/", "\\")
+        command_line = utils.format_single_request_command(
+            request,
+            cmd_template,
+            common_vars
+        )
+        if is_windows:
+            # Note: this / to \ substitution may be too aggressive?
+            command_line = command_line.replace("/", "\\")
          print("Running: %s" % command_line)
-        res = subprocess.run(command_line)
+        res = subprocess.run(command_line, shell=True)
          return res.returncode
      assert False
diff --git a/icu4c/source/data/buildtool/renderers/unix_exec.py b/icu4c/source/data/buildtool/renderers/unix_exec.py

new file mode 100644 (file)

index 0000000..468f413
--- /dev/null
+++ b/icu4c/source/data/buildtool/renderers/unix_exec.py
@@ -0,0 +1,7 @@
+# Copyright (C) 2018 and later: Unicode, Inc. and others.
+# License & terms of use: http://www.unicode.org/copyright.html
+
+from . import common_exec
+
+def run(**kwargs):
+    return common_exec.run(is_windows=False, **kwargs)
diff --git a/icu4c/source/data/buildtool/renderers/windows_exec.py b/icu4c/source/data/buildtool/renderers/windows_exec.py

new file mode 100644 (file)

index 0000000..731801e
--- /dev/null
+++ b/icu4c/source/data/buildtool/renderers/windows_exec.py
@@ -0,0 +1,7 @@
+# Copyright (C) 2018 and later: Unicode, Inc. and others.
+# License & terms of use: http://www.unicode.org/copyright.html
+
+from . import common_exec
+
+def run(**kwargs):
+    return common_exec.run(is_windows=True, **kwargs)
diff --git a/icu4c/source/data/makedata.mak b/icu4c/source/data/makedata.mak

index 85b44881577ccee3d766f535ea33bfb4423e3767..06fcc7267a7c19fb2a4e2a493204844756c40da4 100644 (file)
--- a/icu4c/source/data/makedata.mak
+++ b/icu4c/source/data/makedata.mak
@@ -234,7 +234,7 @@ $(TOOLS_TS): "$(ICUTOOLS)\genrb\$(CFGTOOLS)\genrb.exe" "$(ICUTOOLS)\gencnval\$(C
  $(COREDATA_TS):
         @cd "$(ICUSRCDATA)"
         py -3 -m buildtool \
-               --format windirect \
+               --mode windows-exec \
                 --in_dir "$(ICUSRCDATA)" \
                 --tool_dir "$(ICUTOOLS)" \
                 --tool_cfg "$(CFG)" \
diff --git a/icu4c/source/test/testdata/testdata.mak b/icu4c/source/test/testdata/testdata.mak

index 8d89f0019f99a6c270acb696994dad1297a03c90..9d799f007440170f96cc89b67626db6a97b91cfb 100644 (file)
--- a/icu4c/source/test/testdata/testdata.mak
+++ b/icu4c/source/test/testdata/testdata.mak
@@ -36,10 +36,9 @@ CREATE_DIRS :
         @echo Building test data
         set PYTHONPATH=$(ICUSRCDATA);%PYTHONPATH%
         py -3 -m buildtool \
-               --format windirect \
+               --mode windows-exec \
                 --tool_dir "$(ICUTOOLS)" \
                 --tool_cfg "$(CFG)" \
-               --glob_dir "$(TESTDATA)" \
                 --in_dir "$(TESTDATA)" \
                 --tmp_dir "$(TESTDATATMP)" \
                 --out_dir "$(TESTDATABLD)"
author	Shane Carr <shane@unicode.org>
	Wed, 23 Jan 2019 08:26:31 +0000 (00:26 -0800)
committer	Shane F. Carr <shane@unicode.org>
	Fri, 25 Jan 2019 23:34:44 +0000 (15:34 -0800)
icu4c/source/configure		patch \| blob \| history
icu4c/source/configure.ac		patch \| blob \| history
icu4c/source/data/BUILDRULES.py		patch \| blob \| history
icu4c/source/data/buildtool/__main__.py		patch \| blob \| history
icu4c/source/data/buildtool/renderers/common_exec.py	[moved from icu4c/source/data/buildtool/renderers/windirect.py with 68% similarity]	patch \| blob \| history
icu4c/source/data/buildtool/renderers/unix_exec.py	[new file with mode: 0644]	patch \| blob
icu4c/source/data/buildtool/renderers/windows_exec.py	[new file with mode: 0644]	patch \| blob
icu4c/source/data/makedata.mak		patch \| blob \| history
icu4c/source/test/testdata/testdata.mak		patch \| blob \| history