forked from databricks/megablocks
-
Notifications
You must be signed in to change notification settings - Fork 1
/
setup.py
67 lines (58 loc) · 1.65 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
from setuptools import setup, find_packages
import os
import torch
from torch.utils.cpp_extension import BuildExtension, CUDAExtension
if os.environ.get("TORCH_CUDA_ARCH_LIST"):
# Let PyTorch builder to choose device to target for.
device_capability = ""
else:
device_capability = torch.cuda.get_device_capability()
device_capability = f"{device_capability[0]}{device_capability[1]}"
nvcc_flags = [
"--ptxas-options=-v",
"--optimize=2",
]
if device_capability:
nvcc_flags.append(
f"--generate-code=arch=compute_{device_capability},code=sm_{device_capability}"
)
ext_modules = [
CUDAExtension(
"megablocks_ops",
["csrc/ops.cu"],
include_dirs=["csrc"],
extra_compile_args={"cxx": ["-fopenmp"], "nvcc": nvcc_flags},
)
]
install_requires=[
"triton>=2.1.0",
"stanford-stk>=0.0.6",
]
extra_deps = {}
extra_deps["gg"] = [
"grouped_gemm",
]
extra_deps["dev"] = [
"absl-py",
]
extra_deps['all'] = set(dep for deps in extra_deps.values() for dep in deps)
setup(
name="megablocks",
version="0.5.1",
author="Trevor Gale",
author_email="[email protected]",
description="MegaBlocks",
long_description=open('README.md').read(),
long_description_content_type='text/markdown',
url="https://github.com/stanford-futuredata/megablocks",
classifiers=[
"Programming Language :: Python :: 3",
"License :: OSI Approved :: BSD License",
"Operating System :: Unix",
],
packages=find_packages(),
ext_modules=ext_modules,
cmdclass={"build_ext": BuildExtension},
install_requires=install_requires,
extras_require=extra_deps,
)