-
Notifications
You must be signed in to change notification settings - Fork 20
/
Copy pathsetup.py
208 lines (176 loc) · 8.92 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
"""
Build / install instructions:
- use a virtual env (conda or whatever you want)
- install pytorch nightly (https://pytorch.org/get-started/locally/)
- pip install -e . --no-build-isolation
Note:
The "torch" package is not just a runtime dependency but also a *build time*
dependency, since we are including pytorch's headers. We are however not
specifying either of these dependencies in our pyproject.toml file.
Why we don't specify torch as a runtime dep: I'm not 100% sure, all I know is
that no project does it and those who tried had tons of problems. I think it has
to do with the fact that there are different flavours of torch (cpu, cuda, etc.)
and the pyproject.toml system does not allow a fine-grained enough control over
that.
Why we don't specify torch as a build time dep: because really developers need
to rely on torch-nightly, not on the stable version of torch. And the only way
to install torch nightly is to specify a custom `--index-url` and sadly
pyproject.toml does not allow that.
To be perfectly honest I'm not 110% sure about the above, but this is definitely
fine for now. Basically what that means is that we expect developers and users
to install the correct version of torch before they install / build torchcodec.
This is what all other libraries expect as well.
Oh, and by default, doing `pip install -e .` would try to build the package in
an isolated virtual environment, not in the current one. But because we're not
specifying torch as a build-time dependency, this fails loudly as torch can't be
found. That's why we're passing `--no-build-isolation`: this tells pip to build
the package within the current virtual env, where torch would have already been
installed.
"""
import os
import subprocess
import sys
from pathlib import Path
import torch
from setuptools import Extension, setup
from setuptools.command.build_ext import build_ext
# Absolute path of the directory containing this setup.py (symlinks resolved).
# It is passed to CMake as the source directory and used to locate
# `version.txt` and `src/torchcodec/version.py`.
_ROOT_DIR = Path(__file__).parent.resolve()
class CMakeBuild(build_ext):
    """``build_ext`` command that builds every native library through CMake.

    Setuptools normally calls ``build_extension()`` once per ``Extension``.
    Here a single placeholder extension named ``FAKE_NAME`` is expected, and
    that one call configures, builds and installs all CMake targets at once.
    """

    def __init__(self, *args, **kwargs):
        # Filled in by build_extension(): the directory into which CMake
        # installs the built libraries.
        self._install_prefix = None
        super().__init__(*args, **kwargs)

    def run(self):
        """Check that ``cmake`` can be launched, then run the regular build.

        Raises:
            RuntimeError: if launching ``cmake --version`` fails with OSError.
        """
        version_probe = ["cmake", "--version"]
        try:
            subprocess.check_output(version_probe)
        except OSError:
            # Drop the OSError context so only the actionable message shows.
            raise RuntimeError("CMake is not available.") from None
        super().run()

    def build_extension(self, ext):
        """Build all the libtorchcodec shared libraries in one CMake run.

        Args:
            ext: the placeholder extension; its name must be ``"FAKE_NAME"``.
        """
        # Setuptools expects one Extension object per shared library and calls
        # this method once for each of them. Our CMake project builds all the
        # libraries together, so declaring one Extension per library would
        # force us to keep Extension names in sync with CMake targets and
        # would invoke CMake repeatedly for no benefit. A single placeholder
        # Extension triggers the CMake build exactly once instead.
        assert ext.name == "FAKE_NAME", f"Unexpected extension name: {ext.name}"

        # The cost of that shortcut: setuptools usually derives the final
        # location of a library from the extension's dotted name, and our
        # placeholder name carries no such information. We therefore handle
        # the relocation ourselves.
        #
        # CMake "installs" the built libraries into a temporary directory
        # (_install_prefix). From there they still have to reach:
        # - the source tree, for editable installs: done in
        #   copy_extensions_to_source();
        # - the temporary wheel directory, when building a wheel: for this to
        #   work the prefix has to end with "torchcodec", which makes
        #   setuptools eventually place the libraries under `torchcodec/`.
        # Installing into a temp dir and then moving the files again may look
        # redundant, but it mirrors what setuptools does in a standard build.
        ext_output_dir = Path(self.get_ext_fullpath(ext.name)).parent.absolute()
        self._install_prefix = ext_output_dir / "torchcodec"
        self._build_all_extensions_with_cmake()

    def _build_all_extensions_with_cmake(self):
        """Configure, build and install the CMake project from ``build_temp``.

        Reads the ``CMAKE_BUILD_TYPE`` (default ``"Release"``) and
        ``ENABLE_CUDA`` (default ``""``) environment variables and forwards
        them to CMake, along with the install prefix, the Torch CMake package
        directory and the running interpreter's ``major.minor`` version.

        Raises:
            subprocess.CalledProcessError: if any cmake invocation fails.
        """
        # NOTE: self.debug (True when running
        # `python setup.py build_ext --debug install`) is not consulted here;
        # the build type comes from the CMAKE_BUILD_TYPE environment variable.
        build_type = os.environ.get("CMAKE_BUILD_TYPE", "Release")
        cuda_flag = os.environ.get("ENABLE_CUDA", "")
        torch_cmake_dir = Path(torch.utils.cmake_prefix_path) / "Torch"
        py_major, py_minor = sys.version_info[:2]

        cmake_args = [
            f"-DCMAKE_INSTALL_PREFIX={self._install_prefix}",
            f"-DTorch_DIR={torch_cmake_dir}",
            "-DCMAKE_VERBOSE_MAKEFILE=ON",
            f"-DCMAKE_BUILD_TYPE={build_type}",
            f"-DPYTHON_VERSION={py_major}.{py_minor}",
            f"-DENABLE_CUDA={cuda_flag}",
        ]

        build_dir = self.build_temp
        Path(build_dir).mkdir(parents=True, exist_ok=True)

        # Configure, build, install: each step runs inside the build dir and
        # aborts the whole build on a non-zero exit status.
        cmake_steps = (
            ["cmake", str(_ROOT_DIR), *cmake_args],
            ["cmake", "--build", "."],
            ["cmake", "--install", "."],
        )
        for command in cmake_steps:
            subprocess.check_call(command, cwd=build_dir)

    def copy_extensions_to_source(self):
        """Copy the installed libraries from the temp prefix into the source tree.

        According to the original author's note, setuptools calls this at the
        end of ``run()`` during editable installs.

        Raises:
            NotImplementedError: on platforms other than linux and darwin.
        """
        self.get_finalized_command("build_py")

        suffix_by_platform = {"linux": "so", "darwin": "dylib"}
        lib_suffix = suffix_by_platform.get(sys.platform)
        if lib_suffix is None:
            raise NotImplementedError(
                "Platforms other than linux/darwin are not supported yet"
            )

        # Relative path: resolved against the current working directory.
        source_package_dir = Path("src/torchcodec/")
        for built_lib in self._install_prefix.glob(f"*.{lib_suffix}"):
            assert "libtorchcodec" in built_lib.name
            target = source_package_dir / built_lib.name
            print(f"Copying {built_lib} to {target}")
            self.copy_file(built_lib, target, level=self.verbose)
# Names of the environment variables that gate wheel builds.
NOT_A_LICENSE_VIOLATION_VAR = "I_CONFIRM_THIS_IS_NOT_A_LICENSE_VIOLATION"
BUILD_AGAINST_ALL_FFMPEG_FROM_S3_VAR = "BUILD_AGAINST_ALL_FFMPEG_FROM_S3"

# Both switches are presence-based: any value, even an empty string, counts
# as "set".
not_a_license_violation = NOT_A_LICENSE_VIOLATION_VAR in os.environ
build_against_all_ffmpeg_from_s3 = BUILD_AGAINST_ALL_FFMPEG_FROM_S3_VAR in os.environ

# Refuse to build a wheel unless at least one of the two switches is set.
if (
    "bdist_wheel" in sys.argv
    and not build_against_all_ffmpeg_from_s3
    and not not_a_license_violation
):
    raise ValueError(
        "It looks like you're trying to build a wheel. "
        f"You probably want to set {BUILD_AGAINST_ALL_FFMPEG_FROM_S3_VAR}. "
        f"If you have a good reason *not* to, then set {NOT_A_LICENSE_VIOLATION_VAR}."
    )
# Placeholder extension with no sources: it exists only so that setuptools
# calls `CMakeBuild.build_extension()`, which checks for this exact name.
fake_extension = Extension("FAKE_NAME", [])
def _write_version_files():
    """Write ``version.txt`` and/or ``src/torchcodec/version.py``.

    If the ``BUILD_VERSION`` environment variable is set and non-empty, its
    value is used verbatim and ``version.txt`` is overwritten with it.
    Otherwise the version is the first line of ``version.txt``, suffixed with
    ``+<first 7 chars of the git HEAD sha>`` when the sha can be obtained.

    In both cases ``src/torchcodec/version.py`` is (re)generated with a
    ``__version__`` assignment.
    """
    version_txt = _ROOT_DIR / "version.txt"
    version_py = _ROOT_DIR / "src/torchcodec/version.py"

    version = os.getenv("BUILD_VERSION")
    if version:
        # BUILD_VERSION is set by the `test-infra` build jobs. It typically is
        # the content of `version.txt` plus some suffix like "+cpu" or
        # "+cu112". See
        # https://github.com/pytorch/test-infra/blob/61e6da7a6557152eb9879e461a26ad667c15f0fd/tools/pkg-helpers/pytorch_pkg_helpers/version.py#L113
        version_txt.write_text(version)
    else:
        with version_txt.open() as handle:
            version = handle.readline().strip()
        # Best effort: a missing git binary or a non-git checkout only costs
        # us the "+sha" suffix, never the build.
        try:
            head = subprocess.check_output(
                ["git", "rev-parse", "HEAD"], cwd=str(_ROOT_DIR)
            )
            version += "+" + head.decode("ascii").strip()[:7]
        except Exception:
            print("INFO: Didn't find sha. Is this a git repo?")

    version_py.write_text(
        "# Note that this file is generated during install.\n"
        f"__version__ = '{version}'\n"
    )
# Generate the version files first, then hand control over to setuptools with
# the placeholder extension and the CMake-driven `build_ext` command.
_write_version_files()

setup(
    cmdclass={"build_ext": CMakeBuild},
    ext_modules=[fake_extension],
)