apache · junrushao · Feb 4, 2021 · Jan 15, 2021 · Jan 26, 2021 · Jan 26, 2021
diff --git a/python/gen_requirements.py b/python/gen_requirements.py
@@ -0,0 +1,391 @@
+#!/usr/bin/env python3
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""TVM Python requriements.txt generator.
+
+This script generates a set of requirements.txt files (stored in `./requirements`) that describe
+TVM's Python dependencies.
+
+## Pieces
+
+TVM can be roughly broken into these named pieces along the lines of Python dependencies:
+
+- "core": A core piece, which is intended to be buildable with very few external dependencies. Users
+  can use Relay, compile models, and run autotuning with this part.
+- "importer-<tool>": Model importers, which convert models defined in various other tools (i.e.
+  TensorFlow, PyTorch, etc) into Relay models.
+- Extra features (i.e. XGBoost in AutoTVM). These enhance TVM's functionality, but aren't required
+  for basic operation.
+
+## What this tool does
+
+From these pieces, this tool builds:
+ - requirements/<name>.txt - Python dependencies for each named piece above, `<name>` is the same as
+   the quoted piece name.
+ - requirements/all.txt - Consolidated Python dependencies for all pieces, excluding dev below.
+ - requirements/dev.txt - Python dependencies needed to develop TVM, such as lint and test tools.
+
+The data representing each piece is contained in the two maps below.
+"""
+
+import argparse
+import collections
+import os
+import re
+import textwrap
+import sys
+
+# Maps named TVM piece (see description above) to a list of names of Python packages. Please use
+# alphabetical order for each package list, and do not add version constraints here!
+REQUIREMENTS_BY_PIECE = [
+    # Base requirements needed to install tvm with no extras.
+    ("core", [
+        "attrs",
+        "decorator",
+        "numpy",
+        "psutil",
+        "scipy",
+        "synr",
+    ]),
+
+    # Relay frontends.
+    ("importer-caffe2", ["torch"]),
+    ("importer-coreml", ["coremltools"]),
+    ("importer-darknet", ["opencv-python"]),
+    ("importer-keras", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-onnx", ["future", "onnx", "onnxruntime", "torch", "torchvision"]),
+    ("importer-pytorch", ["future", "torch", "torchvision"]),
+    ("importer-tensorflow", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-tflite", ["tensorflow", "tensorflow-estimator", "tflite"]),
+
+    ("tvmc", ["onnx", "onnxruntime", "tensorflow", "tflite", "torch", "torchvision"]),
+
+    # XGBoost, useful for autotuning on some targets.
+    ("xgboost", ["torch"]),
+
+    # Development requirements
+    ("dev", ["matplotlib", "pillow"]),
+]
+
+# Maps a named Python package (which should appear in REQUIREMENTS_BY_PIECE above) to a
+# semver or pip version constraint. Semver constraints are translated into requirements.txt
+# constraints.
+CONSTRAINTS = [
+  ("onnx", ">=1.7.0"),
+  ("onnxruntime", ">=1.0.0"),
+  ("pillow", "<7"),
+  ("synr", ">=0.2.1"),
+  ("tensorflow", ">=2.1.0"),
+  ("tflite", ">=2.1.0"),
+  ("torch", "^1.7.0"),
+  ("torchvision", ">=0.5.0"),
+]
+
+################################################################################
+# End of configuration options.
+################################################################################
+
+
+
+
+# Required keys in REQUIREMENTS_BY_PIECE.
+REQUIRED_PIECES = ["core", "dev"]
+
+# Regex to validates piece names.
+PIECE_REGEX = re.compile(r"^[a-z0-9][a-z0-9-]*", re.IGNORECASE)
+
+# Regex to match a constraint specification. Multiple constraints are not supported.
+CONSTRAINT_REGEX = re.compile(r"(?:\^|\<|(?:<=)|(?:==)|(?:>=)|\>)[^<>=\^,]+")
+
+# Regex for parsing semantic versions. See
+# https://semver.org/#is-there-a-suggested-regular-expression-regex-to-check-a-semver-string
+SEMVER_REGEX = re.compile(r"^(?P<major>0|[1-9]\d*)\.(?P<minor>0|[1-9]\d*)\.(?P<patch>0|[1-9]\d*)(?:-(?P<prerelease>(?:0|[1-9]\d*|\d*[a-zA-Z-][0-9a-zA-Z-]*)(?:\.(?:0|[1-9]\d*|\d*[a-zA-Z-][0-9a-zA-Z-]*))*))?(?:\+(?P<buildmetadata>[0-9a-zA-Z-]+(?:\.[0-9a-zA-Z-]+)*))?$")
+
+
+def validate_requirements_by_piece():
+  problems = []
+
+  unseen_required_pieces = set(REQUIRED_PIECES)
+  seen_pieces = set()
+
+  # Ensure that core is listed first and dev is listed last.
+  saw_core = False
+  saw_dev = False
+
+  if not isinstance(REQUIREMENTS_BY_PIECE, (list, tuple)):
+    problems.append(f"must be list or tuple, see {REQUIREMENTS_BY_PIECE!r}")
+
+  for piece, deps in REQUIREMENTS_BY_PIECE:
+    if not isinstance(piece, str):
+      problems.append(f"key {piece!r}: must be str, see {piece!r}")
+      continue
+
+    if piece in unseen_required_pieces:
+      unseen_required_pieces.remove(piece)
+
+    piece_lower = piece.lower()
+    if piece_lower in seen_pieces:
+      problems.append(f"piece {piece}: listed twice")
+
+    seen_pieces.add(piece_lower)
+
+    if not saw_core and piece != "core":
+      problems.append(f'must list "core" before {piece}')
+    elif piece == "core":
+      saw_core = True
+
+    if saw_dev:
+      problems.append(f'must list "dev" last')
+    elif piece == "dev":
+      saw_dev = True
+
+    if not isinstance(deps, (list, tuple)):
+      problems.append(f'value for key "{piece}" should be list or tuple, see {deps!r}')
+      continue
+
+    if list(sorted(deps)) != list(deps):
+      problems.append(f"deps for key {piece} must be sorted. Correct order:\n  {list(sorted(deps))!r}")
+
+    piece_deps = set()
+    for d in deps:
+      if CONSTRAINT_REGEX.search(d):
+        problems.append(f"for piece {piece}: dependency {d} should not specify a version. "
+                        "Add it to CONSTRAINTS instead.")
+
+      if d.lower() in piece_deps:
+        problems.append(f'for piece {piece}: dependency {d} listed twice')
+
+      piece_deps.add(d.lower())
+
+  extras_pieces = [k for (k, _) in REQUIREMENTS_BY_PIECE if k not in ("dev", "core")]
+  sorted_extras_pieces = list(sorted(extras_pieces))
+  if sorted_extras_pieces != list(extras_pieces):
+    problems.append('pieces other than "core" and "dev" must appear in alphabetical order'
+                    f"{sorted_extras_pieces}")
+
+  return problems
+
+
+def parse_semver(package, constraint, problems):
+  """Parse a semantic versioning constraint of the form "^X.[.Y[.Z[...]]]]"
+
+  Parameters
+  ----------
+  package : str
+      Name of the package specifying this constraint, for reporting problems.
+  constraint : str
+      The semver constraint. Must start with "^"
+  problems : List[str]
+      A list of strings describing problems that have occurred validating the configuration.
+      Problems encountered while validating constraint are appended to this list.
+
+  Returns
+  -------
+  List[str], int :
+      A 2-tuple. The first element is a list containing an entry for each component in the
+      semver string (components separated by "."). The second element is the index of the
+      component in the list which must not change to meet the semver constraint.
+
+      See "Caret requirements" at https://python-poetry.org/docs/versions/.
+  """
+  m = SEMVER_REGEX.match(constraint[1:])
+  if not m:
+    problems.append(f"{package}: invalid semver constraint {constraint}")
+    return [], 0
+
+  min_ver_parts = list(m.groups())
+
+  # Remove the end
+  while min_ver_parts and min_ver_parts[-1] is None or not min_ver_parts[-1].strip():
+    min_ver_parts.pop()
+
+  for i, p in enumerate(min_ver_parts):
+    try:
+      x = int(p.strip())
+    except ValueError as p:
+      if i == len(parts) - 1 and i > 0:
+        # If a pre-release tag is specified (i.e. 1.2.0pre3), allow.
+        return min_ver_parts, i - 1
+
+      problems.append(
+        f"{package}: semver constraint with non-numeric leading component: {constraint}")
+      return [], 0
+
+    if x:
+      return min_ver_parts, i
+
+  else:
+    # All 0's
+    return min_ver_parts, 0
+
+
+def validate_constraints():
+  problems = []
+
+  if not isinstance(CONSTRAINTS, (list, tuple)):
+    problems.append(f"must be list or tuple, see: {CONSTRAINTS!r}")
+
+  seen_packages = set()
+  all_deps = set()
+  for _, deps in REQUIREMENTS_BY_PIECE:
+    for d in deps:
+      all_deps.add(d.lower())
+
+  for package, constraint in CONSTRAINTS:
+    if package in seen_packages:
+      problems.append(f"{package}: specified twice")
+
+    if package.lower() not in all_deps:
+      problems.append(f"{package}: not specified in REQUIREMENTS_BY_PIECE")
+
+    if not CONSTRAINT_REGEX.match(constraint):
+      problems.append(f'{package}: constraint "{constraint}" does not look like a valid constraint')
+
+    if constraint.startswith("^"):
+      parse_semver(package, constraint, problems)
+
+  all_constrained_packages = [p for (p, _) in CONSTRAINTS]
+  sorted_constrained_packages = list(sorted(all_constrained_packages))
+  if sorted_constrained_packages != all_constrained_packages:
+    problems.append("CONSTRAINTS entries should be in this sorted order: "
+                    f'{sorted_constrained_packages}')
+
+  return problems
+
+
+class ValidationError(Exception):
+  """Raised when a validation error occurs."""
+
+  @staticmethod
+  def format_problems(config, problems):
+    formatted = []
+    for p in problems:
+      assert isinstance(p, str), f"problems element not a str: {p}"
+      formatted.append('\n'.join(
+        textwrap.wrap(f"{config}: {p}", width=80, initial_indent=" * ", subsequent_indent="   ")))
+
+    return '\n'.join(formatted)
+
+  def __init__(self, config, problems):
+    super(ValidationError, self).__init__(self.format_problems(config, problems))
+    self.problems = problems
+
+
+def validate_or_raise():
+  problems = validate_requirements_by_piece()
+  if problems:
+    raise ValidationError("REQUIREMENTS_BY_PIECE", problems)
+
+  problems = validate_constraints()
+  if problems:
+    raise ValidationError("CONSTRAINTS", problems)
+
+
+def semver_to_requirements(piece, dep, constraint, joined_deps):
+  problems = []
+  min_ver_parts, fixed_index = parse_semver(dep, constraint, problems)
+  assert not problems
+
+  # i is now the index of the version component which must not change.
+  try:
+    fixed_part = int(min_ver_parts[fixed_index])
+  except ValueError:
+    problems.append(
+      f"piece {piece}: dependency {dep} has semver constraint with non-integer leading parts: {ver}")
+    return
+
+  max_ver_parts = (min_ver_parts[:fixed_index] +
+                   [str(int(min_ver_parts[fixed_index]) + 1)] +
+                   ["0" for _ in min_ver_parts[fixed_index + 1:]])
+  joined_deps.append(f'{dep}>={".".join(min_ver_parts)},<{".".join(max_ver_parts)}')
+
+
+def join_requirements():
+  """Validate, then join REQUIRMENTS_BY_PIECE against CONSTRAINTS and return the result.
+
+  Returns
+  -------
+  An OrderedDict containing REQUIREMENTS_BY_PIECE, except any dependency mentioned in CONSTRAINTS
+  is replaced by a setuptools-compatible constraint.
+  """
+  validate_or_raise()
+
+  constraints_map = collections.OrderedDict(
+    [(p.lower(), c) for (p, c) in CONSTRAINTS])
+
+  to_return = collections.OrderedDict()
+  all_deps = set()
+  for piece, deps in REQUIREMENTS_BY_PIECE:
+    joined_deps = []
+    for d in deps:
+      constraint = constraints_map.get(d.lower())
+      if constraint is None:
+        joined_deps.append(d)
+        continue
+
+      if constraint[0] == "^":
+        # Translate semver to requirements:
+        semver_to_requirements(piece, d, constraint, joined_deps)
+      else:
+        joined_deps.append(f"{d}{constraint}")
+
+    if piece != "dev":
+      all_deps.update(joined_deps)
+
+    to_return[piece] = joined_deps
+
+  to_return["all"] = all_deps
+
+  return to_return
+
+
+def parse_args():
+  parser = argparse.ArgumentParser()
+  parser.add_argument("--lint", action="store_true",
+                      help="Just lint dependencies, don't generate anything")
+  return parser.parse_args()
+
+
+def main():
+  args = parse_args()
+  try:
+    joined_deps = join_requirements()
+  except ValidationError as e:
+    print(f"ERROR: invalid requirements configuration in {__file__}:", file=sys.stderr)
+    print(str(e), file=sys.stderr)
+    sys.exit(2)
+
+  if args.lint:
+    sys.exit(0)
+
+  output_dir = os.path.join(os.path.dirname(__file__), "requirements")
+  if not os.path.exists(output_dir):
+    os.makedirs(output_dir)
+  elif not os.path.isdir(output_dir):
+    print(f"ERROR: output directory {output_dir} exists but is not a dir. Delete it",
+          file=sys.stderr)
+    sys.exit(2)
+
+  for piece, deps in joined_deps.items():
+    with open(os.path.join(output_dir, f"{piece}.txt"), "w") as f:
+      for d in deps:
+        f.write(f"{d}{os.linesep}")
+
+
+if __name__ == "__main__":
+  main()