mdw-octoml commented on a change in pull request #7289:
URL: https://github.com/apache/tvm/pull/7289#discussion_r558479917



##########
File path: python/gen_requirements.py
##########
@@ -0,0 +1,391 @@
+#!/usr/bin/env python3
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""TVM Python requriements.txt generator.
+
+This script generates a set of requirements.txt files (stored in 
`./requirements`) that describe
+TVM's Python dependencies.
+
+## Pieces
+
+TVM can be roughly broken into these named pieces along the lines of Python 
dependencies:
+
+- "core": A core piece, which is intended to be buildable with very few 
external dependencies. Users
+  can use Relay, compile models, and run autotuning with this part.
+- "importer-<tool>": Model importers, which convert models defined in various 
other tools (i.e.
+  TensorFlow, PyTorch, etc) into Relay models.
+- Extra features (i.e. XGBoost in AutoTVM). These enhance TVM's functionality, 
but aren't required
+  for basic operation.
+
+## What this tool does
+
+From these pieces, this tool builds:
+ - requirements/<name>.txt - Python dependencies for each named piece above, 
`<name>` is the same as
+   the quoted piece name.
+ - requirements/all.txt - Consolidated Python dependencies for all pieces, 
excluding dev below.
+ - requirements/dev.txt - Python dependencies needed to develop TVM, such as 
lint and test tools.
+
+The data representing each piece is contained in the two maps below.
+"""
+
+import argparse
+import collections
+import os
+import re
+import textwrap
+import sys
+
+# Maps named TVM piece (see description above) to a list of names of Python 
packages. Please use
+# alphabetical order for each package list, and do not add version constraints 
here!
+REQUIREMENTS_BY_PIECE = [
+    # Base requirements needed to install tvm with no extras.
+    ("core", [
+        "attrs",
+        "decorator",
+        "numpy",
+        "psutil",
+        "scipy",
+        "synr",
+    ]),
+
+    # Relay frontends.
+    ("importer-caffe2", ["torch"]),
+    ("importer-coreml", ["coremltools"]),
+    ("importer-darknet", ["opencv-python"]),
+    ("importer-keras", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-onnx", ["future", "onnx", "onnxruntime", "torch", 
"torchvision"]),
+    ("importer-pytorch", ["future", "torch", "torchvision"]),
+    ("importer-tensorflow", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-tflite", ["tensorflow", "tensorflow-estimator", "tflite"]),
+
+    ("tvmc", ["onnx", "onnxruntime", "tensorflow", "tflite", "torch", 
"torchvision"]),
+
+    # XGBoost, useful for autotuning on some targets.
+    ("xgboost", ["torch"]),
+
+    # Development requirements
+    ("dev", ["matplotlib", "pillow"]),
+]
+
+# Maps a named Python package (which should appear in REQUIREMENTS_BY_PIECE 
above) to a
+# semver or pip version constraint. Semver constraints are translated into 
requirements.txt
+# constraints.
+CONSTRAINTS = [
+  ("onnx", ">=1.7.0"),
+  ("onnxruntime", ">=1.0.0"),
+  ("pillow", "<7"),
+  ("synr", ">=0.2.1"),
+  ("tensorflow", ">=2.1.0"),
+  ("tflite", ">=2.1.0"),
+  ("torch", "^1.7.0"),
+  ("torchvision", ">=0.5.0"),
+]
+
+################################################################################
+# End of configuration options.
+################################################################################
+
+
+
+
+# Required keys in REQUIREMENTS_BY_PIECE.
+REQUIRED_PIECES = ["core", "dev"]
+
+# Regex to validates piece names.
+PIECE_REGEX = re.compile(r"^[a-z0-9][a-z0-9-]*", re.IGNORECASE)
+
+# Regex to match a constraint specification. Multiple constraints are not 
supported.
+CONSTRAINT_REGEX = re.compile(r"(?:\^|\<|(?:<=)|(?:==)|(?:>=)|\>)[^<>=\^,]+")

Review comment:
       Have you considered using https://pypi.org/project/semver/ instead of 
rolling your own? Or is this script required to run with no deps?

##########
File path: python/gen_requirements.py
##########
@@ -0,0 +1,391 @@
+#!/usr/bin/env python3
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""TVM Python requriements.txt generator.
+
+This script generates a set of requirements.txt files (stored in 
`./requirements`) that describe
+TVM's Python dependencies.
+
+## Pieces
+
+TVM can be roughly broken into these named pieces along the lines of Python 
dependencies:
+
+- "core": A core piece, which is intended to be buildable with very few 
external dependencies. Users
+  can use Relay, compile models, and run autotuning with this part.
+- "importer-<tool>": Model importers, which convert models defined in various 
other tools (i.e.
+  TensorFlow, PyTorch, etc) into Relay models.
+- Extra features (i.e. XGBoost in AutoTVM). These enhance TVM's functionality, 
but aren't required
+  for basic operation.
+
+## What this tool does
+
+From these pieces, this tool builds:
+ - requirements/<name>.txt - Python dependencies for each named piece above, 
`<name>` is the same as
+   the quoted piece name.
+ - requirements/all.txt - Consolidated Python dependencies for all pieces, 
excluding dev below.
+ - requirements/dev.txt - Python dependencies needed to develop TVM, such as 
lint and test tools.
+
+The data representing each piece is contained in the two maps below.
+"""
+
+import argparse
+import collections
+import os
+import re
+import textwrap
+import sys
+
+# Maps named TVM piece (see description above) to a list of names of Python 
packages. Please use
+# alphabetical order for each package list, and do not add version constraints 
here!
+REQUIREMENTS_BY_PIECE = [
+    # Base requirements needed to install tvm with no extras.
+    ("core", [
+        "attrs",
+        "decorator",
+        "numpy",
+        "psutil",
+        "scipy",
+        "synr",
+    ]),
+
+    # Relay frontends.
+    ("importer-caffe2", ["torch"]),
+    ("importer-coreml", ["coremltools"]),
+    ("importer-darknet", ["opencv-python"]),
+    ("importer-keras", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-onnx", ["future", "onnx", "onnxruntime", "torch", 
"torchvision"]),
+    ("importer-pytorch", ["future", "torch", "torchvision"]),
+    ("importer-tensorflow", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-tflite", ["tensorflow", "tensorflow-estimator", "tflite"]),
+
+    ("tvmc", ["onnx", "onnxruntime", "tensorflow", "tflite", "torch", 
"torchvision"]),
+
+    # XGBoost, useful for autotuning on some targets.
+    ("xgboost", ["torch"]),
+
+    # Development requirements
+    ("dev", ["matplotlib", "pillow"]),
+]
+
+# Maps a named Python package (which should appear in REQUIREMENTS_BY_PIECE 
above) to a
+# semver or pip version constraint. Semver constraints are translated into 
requirements.txt
+# constraints.
+CONSTRAINTS = [
+  ("onnx", ">=1.7.0"),
+  ("onnxruntime", ">=1.0.0"),
+  ("pillow", "<7"),
+  ("synr", ">=0.2.1"),
+  ("tensorflow", ">=2.1.0"),
+  ("tflite", ">=2.1.0"),
+  ("torch", "^1.7.0"),
+  ("torchvision", ">=0.5.0"),
+]
+
+################################################################################
+# End of configuration options.
+################################################################################
+
+
+
+
+# Required keys in REQUIREMENTS_BY_PIECE.
+REQUIRED_PIECES = ["core", "dev"]
+
+# Regex to validates piece names.
+PIECE_REGEX = re.compile(r"^[a-z0-9][a-z0-9-]*", re.IGNORECASE)
+
+# Regex to match a constraint specification. Multiple constraints are not 
supported.
+CONSTRAINT_REGEX = re.compile(r"(?:\^|\<|(?:<=)|(?:==)|(?:>=)|\>)[^<>=\^,]+")
+
+# Regex for parsing semantic versions. See
+# 
https://semver.org/#is-there-a-suggested-regular-expression-regex-to-check-a-semver-string
+SEMVER_REGEX = 
re.compile(r"^(?P<major>0|[1-9]\d*)\.(?P<minor>0|[1-9]\d*)\.(?P<patch>0|[1-9]\d*)(?:-(?P<prerelease>(?:0|[1-9]\d*|\d*[a-zA-Z-][0-9a-zA-Z-]*)(?:\.(?:0|[1-9]\d*|\d*[a-zA-Z-][0-9a-zA-Z-]*))*))?(?:\+(?P<buildmetadata>[0-9a-zA-Z-]+(?:\.[0-9a-zA-Z-]+)*))?$")
+
+
+def validate_requirements_by_piece():

Review comment:
       For new code I would recommend using Python type annotations.

##########
File path: python/gen_requirements.py
##########
@@ -0,0 +1,391 @@
+#!/usr/bin/env python3
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""TVM Python requriements.txt generator.
+
+This script generates a set of requirements.txt files (stored in 
`./requirements`) that describe
+TVM's Python dependencies.
+
+## Pieces
+
+TVM can be roughly broken into these named pieces along the lines of Python 
dependencies:
+
+- "core": A core piece, which is intended to be buildable with very few 
external dependencies. Users
+  can use Relay, compile models, and run autotuning with this part.
+- "importer-<tool>": Model importers, which convert models defined in various 
other tools (i.e.
+  TensorFlow, PyTorch, etc) into Relay models.
+- Extra features (i.e. XGBoost in AutoTVM). These enhance TVM's functionality, 
but aren't required
+  for basic operation.
+
+## What this tool does
+
+From these pieces, this tool builds:
+ - requirements/<name>.txt - Python dependencies for each named piece above, 
`<name>` is the same as
+   the quoted piece name.
+ - requirements/all.txt - Consolidated Python dependencies for all pieces, 
excluding dev below.
+ - requirements/dev.txt - Python dependencies needed to develop TVM, such as 
lint and test tools.
+
+The data representing each piece is contained in the two maps below.
+"""
+
+import argparse
+import collections
+import os
+import re
+import textwrap
+import sys
+
+# Maps named TVM piece (see description above) to a list of names of Python 
packages. Please use
+# alphabetical order for each package list, and do not add version constraints 
here!
+REQUIREMENTS_BY_PIECE = [
+    # Base requirements needed to install tvm with no extras.
+    ("core", [
+        "attrs",
+        "decorator",
+        "numpy",
+        "psutil",
+        "scipy",
+        "synr",
+    ]),
+
+    # Relay frontends.
+    ("importer-caffe2", ["torch"]),
+    ("importer-coreml", ["coremltools"]),
+    ("importer-darknet", ["opencv-python"]),
+    ("importer-keras", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-onnx", ["future", "onnx", "onnxruntime", "torch", 
"torchvision"]),
+    ("importer-pytorch", ["future", "torch", "torchvision"]),
+    ("importer-tensorflow", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-tflite", ["tensorflow", "tensorflow-estimator", "tflite"]),
+
+    ("tvmc", ["onnx", "onnxruntime", "tensorflow", "tflite", "torch", 
"torchvision"]),
+
+    # XGBoost, useful for autotuning on some targets.
+    ("xgboost", ["torch"]),
+
+    # Development requirements
+    ("dev", ["matplotlib", "pillow"]),
+]
+
+# Maps a named Python package (which should appear in REQUIREMENTS_BY_PIECE 
above) to a
+# semver or pip version constraint. Semver constraints are translated into 
requirements.txt
+# constraints.
+CONSTRAINTS = [
+  ("onnx", ">=1.7.0"),
+  ("onnxruntime", ">=1.0.0"),
+  ("pillow", "<7"),
+  ("synr", ">=0.2.1"),
+  ("tensorflow", ">=2.1.0"),
+  ("tflite", ">=2.1.0"),
+  ("torch", "^1.7.0"),
+  ("torchvision", ">=0.5.0"),
+]
+
+################################################################################
+# End of configuration options.
+################################################################################
+
+
+
+
+# Required keys in REQUIREMENTS_BY_PIECE.
+REQUIRED_PIECES = ["core", "dev"]
+
+# Regex to validates piece names.
+PIECE_REGEX = re.compile(r"^[a-z0-9][a-z0-9-]*", re.IGNORECASE)
+
+# Regex to match a constraint specification. Multiple constraints are not 
supported.
+CONSTRAINT_REGEX = re.compile(r"(?:\^|\<|(?:<=)|(?:==)|(?:>=)|\>)[^<>=\^,]+")
+
+# Regex for parsing semantic versions. See
+# 
https://semver.org/#is-there-a-suggested-regular-expression-regex-to-check-a-semver-string
+SEMVER_REGEX = 
re.compile(r"^(?P<major>0|[1-9]\d*)\.(?P<minor>0|[1-9]\d*)\.(?P<patch>0|[1-9]\d*)(?:-(?P<prerelease>(?:0|[1-9]\d*|\d*[a-zA-Z-][0-9a-zA-Z-]*)(?:\.(?:0|[1-9]\d*|\d*[a-zA-Z-][0-9a-zA-Z-]*))*))?(?:\+(?P<buildmetadata>[0-9a-zA-Z-]+(?:\.[0-9a-zA-Z-]+)*))?$")
+
+
+def validate_requirements_by_piece():
+  problems = []
+
+  unseen_required_pieces = set(REQUIRED_PIECES)
+  seen_pieces = set()
+
+  # Ensure that core is listed first and dev is listed last.
+  saw_core = False
+  saw_dev = False
+
+  if not isinstance(REQUIREMENTS_BY_PIECE, (list, tuple)):
+    problems.append(f"must be list or tuple, see {REQUIREMENTS_BY_PIECE!r}")
+
+  for piece, deps in REQUIREMENTS_BY_PIECE:
+    if not isinstance(piece, str):
+      problems.append(f"key {piece!r}: must be str, see {piece!r}")
+      continue
+
+    if piece in unseen_required_pieces:
+      unseen_required_pieces.remove(piece)
+
+    piece_lower = piece.lower()
+    if piece_lower in seen_pieces:
+      problems.append(f"piece {piece}: listed twice")
+
+    seen_pieces.add(piece_lower)
+
+    if not saw_core and piece != "core":
+      problems.append(f'must list "core" before {piece}')
+    elif piece == "core":
+      saw_core = True
+
+    if saw_dev:
+      problems.append(f'must list "dev" last')
+    elif piece == "dev":
+      saw_dev = True
+
+    if not isinstance(deps, (list, tuple)):
+      problems.append(f'value for key "{piece}" should be list or tuple, see 
{deps!r}')
+      continue
+
+    if list(sorted(deps)) != list(deps):
+      problems.append(f"deps for key {piece} must be sorted. Correct order:\n  
{list(sorted(deps))!r}")
+
+    piece_deps = set()
+    for d in deps:
+      if CONSTRAINT_REGEX.search(d):
+        problems.append(f"for piece {piece}: dependency {d} should not specify 
a version. "
+                        "Add it to CONSTRAINTS instead.")
+
+      if d.lower() in piece_deps:
+        problems.append(f'for piece {piece}: dependency {d} listed twice')
+
+      piece_deps.add(d.lower())
+
+  extras_pieces = [k for (k, _) in REQUIREMENTS_BY_PIECE if k not in ("dev", 
"core")]
+  sorted_extras_pieces = list(sorted(extras_pieces))
+  if sorted_extras_pieces != list(extras_pieces):
+    problems.append('pieces other than "core" and "dev" must appear in 
alphabetical order'
+                    f"{sorted_extras_pieces}")
+
+  return problems
+
+
+def parse_semver(package, constraint, problems):
+  """Parse a semantic versioning constraint of the form "^X.[.Y[.Z[...]]]]"
+
+  Parameters
+  ----------
+  package : str
+      Name of the package specifying this constraint, for reporting problems.
+  constraint : str
+      The semver constraint. Must start with "^"
+  problems : List[str]
+      A list of strings describing problems that have occurred validating the 
configuration.
+      Problems encountered while validating constraint are appended to this 
list.
+
+  Returns
+  -------
+  List[str], int :
+      A 2-tuple. The first element is a list containing an entry for each 
component in the
+      semver string (components separated by "."). The second element is the 
index of the
+      component in the list which must not change to meet the semver 
constraint.
+
+      See "Caret requirements" at https://python-poetry.org/docs/versions/.
+  """
+  m = SEMVER_REGEX.match(constraint[1:])
+  if not m:
+    problems.append(f"{package}: invalid semver constraint {constraint}")
+    return [], 0
+
+  min_ver_parts = list(m.groups())
+
+  # Remove the end
+  while min_ver_parts and min_ver_parts[-1] is None or not 
min_ver_parts[-1].strip():
+    min_ver_parts.pop()
+
+  for i, p in enumerate(min_ver_parts):
+    try:
+      x = int(p.strip())
+    except ValueError as p:
+      if i == len(parts) - 1 and i > 0:
+        # If a pre-release tag is specified (i.e. 1.2.0pre3), allow.
+        return min_ver_parts, i - 1
+
+      problems.append(
+        f"{package}: semver constraint with non-numeric leading component: 
{constraint}")
+      return [], 0
+
+    if x:
+      return min_ver_parts, i
+
+  else:
+    # All 0's
+    return min_ver_parts, 0
+
+
+def validate_constraints():
+  problems = []
+
+  if not isinstance(CONSTRAINTS, (list, tuple)):
+    problems.append(f"must be list or tuple, see: {CONSTRAINTS!r}")

Review comment:
       This would be an unnecessary check if you used Python type annotations.

##########
File path: python/requirements/all.txt
##########
@@ -0,0 +1,16 @@
+numpy

Review comment:
       I'd recommend adding comments at the top of each of these files to 
indicate what they are used for, since it may not always be obvious from the 
filename. PIP requirements files support `#` 
comments.https://pip.pypa.io/en/latest/reference/pip_install/#requirements-file-format

##########
File path: python/gen_requirements.py
##########
@@ -0,0 +1,391 @@
+#!/usr/bin/env python3
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""TVM Python requriements.txt generator.
+
+This script generates a set of requirements.txt files (stored in 
`./requirements`) that describe
+TVM's Python dependencies.
+
+## Pieces
+
+TVM can be roughly broken into these named pieces along the lines of Python 
dependencies:
+
+- "core": A core piece, which is intended to be buildable with very few 
external dependencies. Users
+  can use Relay, compile models, and run autotuning with this part.
+- "importer-<tool>": Model importers, which convert models defined in various 
other tools (i.e.
+  TensorFlow, PyTorch, etc) into Relay models.
+- Extra features (i.e. XGBoost in AutoTVM). These enhance TVM's functionality, 
but aren't required
+  for basic operation.
+
+## What this tool does
+
+From these pieces, this tool builds:
+ - requirements/<name>.txt - Python dependencies for each named piece above, 
`<name>` is the same as
+   the quoted piece name.
+ - requirements/all.txt - Consolidated Python dependencies for all pieces, 
excluding dev below.
+ - requirements/dev.txt - Python dependencies needed to develop TVM, such as 
lint and test tools.
+
+The data representing each piece is contained in the two maps below.
+"""
+
+import argparse
+import collections
+import os
+import re
+import textwrap
+import sys
+
+# Maps named TVM piece (see description above) to a list of names of Python 
packages. Please use
+# alphabetical order for each package list, and do not add version constraints 
here!
+REQUIREMENTS_BY_PIECE = [
+    # Base requirements needed to install tvm with no extras.
+    ("core", [
+        "attrs",
+        "decorator",
+        "numpy",
+        "psutil",
+        "scipy",
+        "synr",
+    ]),
+
+    # Relay frontends.
+    ("importer-caffe2", ["torch"]),
+    ("importer-coreml", ["coremltools"]),
+    ("importer-darknet", ["opencv-python"]),
+    ("importer-keras", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-onnx", ["future", "onnx", "onnxruntime", "torch", 
"torchvision"]),
+    ("importer-pytorch", ["future", "torch", "torchvision"]),
+    ("importer-tensorflow", ["tensorflow", "tensorflow-estimator"]),
+    ("importer-tflite", ["tensorflow", "tensorflow-estimator", "tflite"]),
+
+    ("tvmc", ["onnx", "onnxruntime", "tensorflow", "tflite", "torch", 
"torchvision"]),
+
+    # XGBoost, useful for autotuning on some targets.
+    ("xgboost", ["torch"]),
+
+    # Development requirements
+    ("dev", ["matplotlib", "pillow"]),
+]
+
+# Maps a named Python package (which should appear in REQUIREMENTS_BY_PIECE 
above) to a
+# semver or pip version constraint. Semver constraints are translated into 
requirements.txt
+# constraints.
+CONSTRAINTS = [
+  ("onnx", ">=1.7.0"),
+  ("onnxruntime", ">=1.0.0"),
+  ("pillow", "<7"),
+  ("synr", ">=0.2.1"),
+  ("tensorflow", ">=2.1.0"),
+  ("tflite", ">=2.1.0"),
+  ("torch", "^1.7.0"),
+  ("torchvision", ">=0.5.0"),
+]
+
+################################################################################
+# End of configuration options.
+################################################################################
+
+
+
+
+# Required keys in REQUIREMENTS_BY_PIECE.
+REQUIRED_PIECES = ["core", "dev"]
+
+# Regex to validates piece names.
+PIECE_REGEX = re.compile(r"^[a-z0-9][a-z0-9-]*", re.IGNORECASE)
+
+# Regex to match a constraint specification. Multiple constraints are not 
supported.
+CONSTRAINT_REGEX = re.compile(r"(?:\^|\<|(?:<=)|(?:==)|(?:>=)|\>)[^<>=\^,]+")
+
+# Regex for parsing semantic versions. See
+# 
https://semver.org/#is-there-a-suggested-regular-expression-regex-to-check-a-semver-string
+SEMVER_REGEX = 
re.compile(r"^(?P<major>0|[1-9]\d*)\.(?P<minor>0|[1-9]\d*)\.(?P<patch>0|[1-9]\d*)(?:-(?P<prerelease>(?:0|[1-9]\d*|\d*[a-zA-Z-][0-9a-zA-Z-]*)(?:\.(?:0|[1-9]\d*|\d*[a-zA-Z-][0-9a-zA-Z-]*))*))?(?:\+(?P<buildmetadata>[0-9a-zA-Z-]+(?:\.[0-9a-zA-Z-]+)*))?$")
+
+
+def validate_requirements_by_piece():
+  problems = []
+
+  unseen_required_pieces = set(REQUIRED_PIECES)
+  seen_pieces = set()
+
+  # Ensure that core is listed first and dev is listed last.
+  saw_core = False
+  saw_dev = False
+
+  if not isinstance(REQUIREMENTS_BY_PIECE, (list, tuple)):
+    problems.append(f"must be list or tuple, see {REQUIREMENTS_BY_PIECE!r}")
+
+  for piece, deps in REQUIREMENTS_BY_PIECE:
+    if not isinstance(piece, str):
+      problems.append(f"key {piece!r}: must be str, see {piece!r}")
+      continue
+
+    if piece in unseen_required_pieces:
+      unseen_required_pieces.remove(piece)
+
+    piece_lower = piece.lower()
+    if piece_lower in seen_pieces:
+      problems.append(f"piece {piece}: listed twice")
+
+    seen_pieces.add(piece_lower)
+
+    if not saw_core and piece != "core":
+      problems.append(f'must list "core" before {piece}')
+    elif piece == "core":
+      saw_core = True
+
+    if saw_dev:
+      problems.append(f'must list "dev" last')
+    elif piece == "dev":
+      saw_dev = True
+
+    if not isinstance(deps, (list, tuple)):
+      problems.append(f'value for key "{piece}" should be list or tuple, see 
{deps!r}')
+      continue
+
+    if list(sorted(deps)) != list(deps):
+      problems.append(f"deps for key {piece} must be sorted. Correct order:\n  
{list(sorted(deps))!r}")
+
+    piece_deps = set()
+    for d in deps:
+      if CONSTRAINT_REGEX.search(d):
+        problems.append(f"for piece {piece}: dependency {d} should not specify 
a version. "
+                        "Add it to CONSTRAINTS instead.")
+
+      if d.lower() in piece_deps:
+        problems.append(f'for piece {piece}: dependency {d} listed twice')
+
+      piece_deps.add(d.lower())
+
+  extras_pieces = [k for (k, _) in REQUIREMENTS_BY_PIECE if k not in ("dev", 
"core")]
+  sorted_extras_pieces = list(sorted(extras_pieces))
+  if sorted_extras_pieces != list(extras_pieces):
+    problems.append('pieces other than "core" and "dev" must appear in 
alphabetical order'
+                    f"{sorted_extras_pieces}")
+
+  return problems
+
+
+def parse_semver(package, constraint, problems):
+  """Parse a semantic versioning constraint of the form "^X.[.Y[.Z[...]]]]"
+
+  Parameters
+  ----------
+  package : str
+      Name of the package specifying this constraint, for reporting problems.
+  constraint : str
+      The semver constraint. Must start with "^"
+  problems : List[str]
+      A list of strings describing problems that have occurred validating the 
configuration.
+      Problems encountered while validating constraint are appended to this 
list.
+
+  Returns
+  -------
+  List[str], int :
+      A 2-tuple. The first element is a list containing an entry for each 
component in the
+      semver string (components separated by "."). The second element is the 
index of the
+      component in the list which must not change to meet the semver 
constraint.
+
+      See "Caret requirements" at https://python-poetry.org/docs/versions/.
+  """
+  m = SEMVER_REGEX.match(constraint[1:])
+  if not m:
+    problems.append(f"{package}: invalid semver constraint {constraint}")
+    return [], 0
+
+  min_ver_parts = list(m.groups())
+
+  # Remove the end
+  while min_ver_parts and min_ver_parts[-1] is None or not 
min_ver_parts[-1].strip():
+    min_ver_parts.pop()
+
+  for i, p in enumerate(min_ver_parts):
+    try:
+      x = int(p.strip())
+    except ValueError as p:
+      if i == len(parts) - 1 and i > 0:
+        # If a pre-release tag is specified (i.e. 1.2.0pre3), allow.
+        return min_ver_parts, i - 1
+
+      problems.append(
+        f"{package}: semver constraint with non-numeric leading component: 
{constraint}")
+      return [], 0
+
+    if x:
+      return min_ver_parts, i
+
+  else:
+    # All 0's
+    return min_ver_parts, 0
+
+
+def validate_constraints():
+  problems = []
+
+  if not isinstance(CONSTRAINTS, (list, tuple)):
+    problems.append(f"must be list or tuple, see: {CONSTRAINTS!r}")
+
+  seen_packages = set()
+  all_deps = set()
+  for _, deps in REQUIREMENTS_BY_PIECE:
+    for d in deps:
+      all_deps.add(d.lower())
+
+  for package, constraint in CONSTRAINTS:
+    if package in seen_packages:
+      problems.append(f"{package}: specified twice")
+
+    if package.lower() not in all_deps:
+      problems.append(f"{package}: not specified in REQUIREMENTS_BY_PIECE")
+
+    if not CONSTRAINT_REGEX.match(constraint):
+      problems.append(f'{package}: constraint "{constraint}" does not look 
like a valid constraint')
+
+    if constraint.startswith("^"):
+      parse_semver(package, constraint, problems)
+
+  all_constrained_packages = [p for (p, _) in CONSTRAINTS]
+  sorted_constrained_packages = list(sorted(all_constrained_packages))
+  if sorted_constrained_packages != all_constrained_packages:
+    problems.append("CONSTRAINTS entries should be in this sorted order: "
+                    f'{sorted_constrained_packages}')
+
+  return problems
+
+
+class ValidationError(Exception):
+  """Raised when a validation error occurs."""
+
+  @staticmethod
+  def format_problems(config, problems):
+    formatted = []
+    for p in problems:
+      assert isinstance(p, str), f"problems element not a str: {p}"
+      formatted.append('\n'.join(
+        textwrap.wrap(f"{config}: {p}", width=80, initial_indent=" * ", 
subsequent_indent="   ")))
+
+    return '\n'.join(formatted)
+
+  def __init__(self, config, problems):
+    super(ValidationError, self).__init__(self.format_problems(config, 
problems))
+    self.problems = problems
+
+
+def validate_or_raise():
+  problems = validate_requirements_by_piece()
+  if problems:
+    raise ValidationError("REQUIREMENTS_BY_PIECE", problems)
+
+  problems = validate_constraints()
+  if problems:
+    raise ValidationError("CONSTRAINTS", problems)
+
+
+def semver_to_requirements(piece, dep, constraint, joined_deps):
+  problems = []
+  min_ver_parts, fixed_index = parse_semver(dep, constraint, problems)
+  assert not problems
+
+  # i is now the index of the version component which must not change.
+  try:
+    fixed_part = int(min_ver_parts[fixed_index])
+  except ValueError:
+    problems.append(
+      f"piece {piece}: dependency {dep} has semver constraint with non-integer 
leading parts: {ver}")
+    return
+
+  max_ver_parts = (min_ver_parts[:fixed_index] +
+                   [str(int(min_ver_parts[fixed_index]) + 1)] +
+                   ["0" for _ in min_ver_parts[fixed_index + 1:]])
+  
joined_deps.append(f'{dep}>={".".join(min_ver_parts)},<{".".join(max_ver_parts)}')
+
+
+def join_requirements():
+  """Validate, then join REQUIRMENTS_BY_PIECE against CONSTRAINTS and return 
the result.
+
+  Returns
+  -------
+  An OrderedDict containing REQUIREMENTS_BY_PIECE, except any dependency 
mentioned in CONSTRAINTS
+  is replaced by a setuptools-compatible constraint.
+  """
+  validate_or_raise()
+
+  constraints_map = collections.OrderedDict(
+    [(p.lower(), c) for (p, c) in CONSTRAINTS])
+
+  to_return = collections.OrderedDict()
+  all_deps = set()
+  for piece, deps in REQUIREMENTS_BY_PIECE:
+    joined_deps = []
+    for d in deps:
+      constraint = constraints_map.get(d.lower())
+      if constraint is None:
+        joined_deps.append(d)
+        continue
+
+      if constraint[0] == "^":
+        # Translate semver to requirements:
+        semver_to_requirements(piece, d, constraint, joined_deps)
+      else:
+        joined_deps.append(f"{d}{constraint}")
+
+    if piece != "dev":
+      all_deps.update(joined_deps)
+
+    to_return[piece] = joined_deps
+
+  to_return["all"] = all_deps
+
+  return to_return
+
+
+def parse_args():
+  parser = argparse.ArgumentParser()
+  parser.add_argument("--lint", action="store_true",
+                      help="Just lint dependencies, don't generate anything")
+  return parser.parse_args()
+
+
+def main():
+  args = parse_args()
+  try:
+    joined_deps = join_requirements()
+  except ValidationError as e:
+    print(f"ERROR: invalid requirements configuration in {__file__}:", 
file=sys.stderr)
+    print(str(e), file=sys.stderr)
+    sys.exit(2)
+
+  if args.lint:
+    sys.exit(0)

Review comment:
       Recommend `return`, not `exit`, since this is a function that could be 
(and, in fact, is!) invoked by another Python library -- same for the error 
cases, raise an Exception, don't exit.

##########
File path: python/setup.py
##########
@@ -171,38 +171,25 @@ def get_package_data_files():
     return ["relay/std/prelude.rly", "relay/std/core.rly"]
 
 
+# Temporarily add this directory to the path so we can import the requirements 
generator
+# tool.
+sys.path.insert(0, os.path.dirname(__file__))
+import gen_requirements
+sys.path.pop(0)
+
+requirements = gen_requirements.join_requirements()

Review comment:
       Do you want to print out some details on what the requirements 
identified are, to help with debugging?




----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org


Reply via email to