-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbuild.py
307 lines (276 loc) · 10.2 KB
/
build.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
import multiprocessing
import os
import platform
import shutil
import subprocess
from contextlib import contextmanager
from pathlib import Path
from typing import Any
from typing import List
import pysam
from Cython.Build import cythonize
from Cython.Distutils.build_ext import new_build_ext as cython_build_ext
from setuptools import Distribution
from setuptools import Extension
def strtobool(value: str) -> bool:
"""Equivalent to distutils strtobool."""
value = value.lower()
trues = {"y", "yes", "t", "true", "on", "1"}
falses = {"n", "no", "f", "false", "off", "0"}
if value in trues:
return True
elif value in falses:
return False
raise ValueError(f"'{value}' is not a valid bool value")
@contextmanager
def changedir(path: str) -> Any:
"""Changes the directory before, and moves back to the original directory after."""
save_dir = os.getcwd()
os.chdir(path)
try:
yield
finally:
os.chdir(save_dir)
USE_GIT: bool = shutil.which("git") is not None and Path(".git").exists() and Path(".git").is_dir()
IS_DARWIN = platform.system() == "Darwin"
def compile_htslib() -> None:
"""Complies htslib prior to entering the context."""
print("Building htslib...")
with changedir("htslib"):
cflags = "CFLAGS='-fpic -fvisibility=hidden -g -Wall -O2"
if IS_DARWIN:
cflags += " -mmacosx-version-min=11.0"
cflags += "'"
commands = [
"autoreconf -i",
f"./configure --with-libdeflate --enable-lzma --enable-bz2 {cflags}",
"make -j",
]
for command in commands:
retcode = subprocess.call(
f"{command}", stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL, shell=True
)
if retcode != 0: # run again for debugging
retcode = subprocess.call(f"{command}", shell=True)
if retcode != 0:
raise RuntimeError(f"Failed to run command {command}")
@contextmanager
def with_patches() -> Any:
"""Applies patches to bwa, then cleans up after exiting the context."""
patches = sorted([
os.path.abspath(patch)
for patch in Path("patches").iterdir()
if patch.is_file() and patch.suffix == ".patch"
])
with changedir("bwa"):
print("Patching bwa...")
for patch in patches:
if USE_GIT:
retcode = subprocess.call(f"git apply --whitespace=nowarn {patch}", shell=True)
else:
retcode = subprocess.call(f"patch -p1 < {patch}", shell=True)
if retcode != 0:
raise RuntimeError(f"Failed to apply patch {patch}")
try:
yield
finally:
if USE_GIT:
commands = ["git submodule deinit -f bwa", "git submodule update --init --recursive"]
for command in commands:
retcode = subprocess.call(command, shell=True)
if retcode != 0:
raise RuntimeError(f"Failed to reset bwa submodule: {command}")
compiler_directives = {
"language_level": "3",
"embedsignature": True,
}
SOURCE_DIR = Path("pybwa")
BUILD_DIR = Path("cython_build")
compile_args: list[str] = []
link_args: list[str] = []
include_dirs = ["htslib", "bwa", "pybwa", os.path.dirname(pysam.__file__)]
libraries = ["m", "z", "pthread", "lzma", "bz2", "curl", "deflate"]
if platform.system() == "Linux":
libraries.append("rt")
library_dirs = ["pybwa", "bwa", "htslib"]
extra_objects = ["htslib/libhts.a"]
define_macros = [
("HAVE_PTHREAD", None),
("USE_MALLOC_WRAPPERS", None),
("USE_HTSLIB", "1"),
]
h_files: list[str] = []
c_files: list[str] = []
exclude_files = {
"pybwa": {"libbwaaln.c", "libbwaindex.c", "libbwamem.c"},
"bwa": {"example.c", "main.c", "kstring.c", "kstring.h"},
}
for root_dir in library_dirs:
if root_dir == "htslib": # these are added via extra_objects above
continue
exc: set[str] = exclude_files.get(root_dir, set())
h_files.extend(
str(x) for x in Path(root_dir).rglob("*.h") if "tests/" not in x.parts and x.name not in exc
)
c_files.extend(
str(x) for x in Path(root_dir).rglob("*.c") if "tests/" not in x.parts and x.name not in exc
)
# Check if we should build with linetracing for coverage
build_with_coverage = os.environ.get("CYTHON_TRACE", "false").lower() in ("1", "true", "'true'")
if build_with_coverage:
compiler_directives["linetrace"] = True
compiler_directives["emit_code_comments"] = True
define_macros.extend([
("CYTHON_TRACE", "1"),
("CYTHON_TRACE_NOGIL", "1"),
("DCYTHON_USE_SYS_MONITORING", "0"),
])
BUILD_DIR = Path(".") # the compiled .c files need to be next to the .pyx files for coverage
if platform.system() != "Windows":
compile_args.extend([
"-Wno-unused-result",
"-Wno-unreachable-code",
"-Wno-single-bit-bitfield-constant-conversion",
"-Wno-deprecated-declarations",
"-Wno-unused",
"-Wno-strict-prototypes",
"-Wno-sign-compare",
"-Wno-error=declaration-after-statement",
"-Wno-implicit-function-declaration",
"-Wno-macro-redefined",
])
libbwaindex_module = Extension(
name="pybwa.libbwaindex",
sources=["pybwa/libbwaindex.pyx"] + c_files,
depends=h_files,
extra_compile_args=compile_args,
extra_link_args=link_args,
extra_objects=extra_objects,
include_dirs=include_dirs,
language="c",
libraries=libraries,
library_dirs=library_dirs,
define_macros=define_macros,
)
libbwaaln_module = Extension(
name="pybwa.libbwaaln",
sources=["pybwa/libbwaaln.pyx"] + c_files,
depends=h_files,
extra_compile_args=compile_args,
extra_link_args=link_args,
extra_objects=extra_objects,
include_dirs=include_dirs,
language="c",
libraries=libraries,
library_dirs=library_dirs,
define_macros=define_macros,
)
libbwamem_module = Extension(
name="pybwa.libbwamem",
sources=["pybwa/libbwamem.pyx"] + c_files,
depends=h_files,
extra_compile_args=compile_args,
extra_link_args=link_args,
extra_objects=extra_objects,
include_dirs=include_dirs,
language="c",
libraries=libraries,
library_dirs=library_dirs,
define_macros=define_macros,
)
def cythonize_helper(extension_modules: List[Extension]) -> Any:
"""Cythonize all Python extensions."""
return cythonize(
module_list=extension_modules,
# Don"t build in source tree (this leaves behind .c files)
build_dir=BUILD_DIR,
# Don"t generate an .html output file. Would contain source.
annotate=False,
# Parallelize our build
nthreads=multiprocessing.cpu_count() * 2,
# Compiler directives (e.g. language, or line tracing for coverage)
compiler_directives=compiler_directives,
# (Optional) Always rebuild, even if files untouched
force=True,
)
CLASSIFIERS = [
"Development Status :: 5 - Production/Stable",
"Environment :: Console",
"Intended Audience :: Developers",
"Intended Audience :: Science/Research",
"License :: OSI Approved :: MIT License",
"Natural Language :: English",
"Operating System :: OS Independent",
"Programming Language :: Python :: 3",
"Programming Language :: Python :: 3.9",
"Programming Language :: Python :: 3.10",
"Programming Language :: Python :: 3.11",
"Programming Language :: Python :: 3.12",
"Programming Language :: Python :: 3.13",
"Topic :: Scientific/Engineering :: Bio-Informatics",
"Topic :: Software Development :: Documentation",
"Topic :: Software Development :: Libraries :: Python Modules",
"Typing :: Typed",
]
def build() -> None:
"""The main build function for pybwa."""
# compile htslib
compile_htslib()
# apply patches to bwa, then revert them after
with with_patches():
print("Building extensions...")
# Collect and cythonize all files
extension_modules = cythonize_helper([
libbwaindex_module,
libbwaaln_module,
libbwamem_module,
])
packages = ["pybwa", "pybwa.include.bwa", "pybwa.include.patches", "pybwa.include.htslib"]
package_dir = {
"pybwa": "pybwa",
"pybwa.include.bwa": "bwa",
"pybwa.include.patches": "patches",
"pybwa.include.htslib": "htslib",
}
# Use Setuptools to collect files
distribution = Distribution({
"name": "pybwa",
"version": "0.0.1",
"description": "Python bindings for BWA",
"long_description": __doc__,
"long_description_content_type": "text/x-rst",
"author": "Nils Homer",
"author_email": "[email protected]",
"license": "MIT",
"platforms": ["POSIX", "UNIX", "MacOS"],
"classifiers": CLASSIFIERS,
"url": "https://github.com/fulcrumgenomics/pybwa",
"packages": packages,
"package_dir": package_dir,
"package_data": {
"": ["*.pxd", "*.h", "*.c", "py.typed", "*.pyi", "*.patch", "**/*.h", "**/*.c"],
},
"ext_modules": extension_modules,
"cmdclass": {
"build_ext": cython_build_ext,
},
"zip_safe": False,
})
# Grab the build_ext command and copy all files back to source dir.
# Done so Poetry grabs the files during the next step in its build.
build_ext_cmd = distribution.get_command_obj("build_ext")
build_ext_cmd.ensure_finalized()
# Set the value to 1 for "inplace", with the goal to build extensions
# in build directory, and then copy all files back to the source dir
# (under the hood, "copy_extensions_to_source" will be called after
# building the extensions). This is done so Poetry grabs the files
# during the next step in its build.
build_ext_cmd.parallel = strtobool(os.environ.get("BUILD_EXTENSIONS_PARALLEL", "True"))
if build_ext_cmd.parallel:
print("Building cython extensions in parallel")
else:
print("Building cython extensions serially")
build_ext_cmd.inplace = True
build_ext_cmd.run()
if __name__ == "__main__":
build()