This repository has been archived by the owner on May 20, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 296
/
Copy pathPKGBUILD
438 lines (391 loc) · 18.8 KB
/
PKGBUILD
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
# Maintainer: Sven-Hendrik Haase <[email protected]>
# Maintainer: Torsten Keßler <[email protected]>
# Contributor: Stephen Zhang <zsrkmyn at gmail dot com>
_pkgname=pytorch
pkgbase="python-${_pkgname}"
pkgname=("${pkgbase}" "${pkgbase}-opt" "${pkgbase}-cuda" "${pkgbase}-opt-cuda" "${pkgbase}-rocm" "${pkgbase}-opt-rocm")
pkgver=2.0.1
_pkgver=2.0.1
pkgrel=1
_pkgdesc='Tensors and Dynamic neural networks in Python with strong GPU acceleration'
pkgdesc="${_pkgdesc}"
arch=('x86_64')
url="https://pytorch.org"
license=('BSD')
depends=('google-glog' 'gflags' 'opencv' 'openmp' 'nccl' 'pybind11' 'python' 'python-yaml' 'libuv'
'python-numpy' 'python-sympy' 'protobuf' 'ffmpeg4.4' 'python-future' 'qt6-base'
'intel-oneapi-mkl' 'python-typing_extensions' 'numactl')
# Exclude the magma package here and add the corresponding {cuda, rocm/hip} version
# to makedepends of the split packages.
# The magma package does not allow to build the cuda and rocm/hip code at the same time,
# so we need to work with the split packages magma-{cuda,hip}.
makedepends=('python' 'python-setuptools' 'python-yaml' 'python-numpy' 'cmake' 'cuda'
'cudnn' 'git' 'rocm-hip-sdk' 'roctracer' 'miopen'
'ninja' 'pkgconfig' 'doxygen' 'vulkan-headers' 'shaderc')
source=("${_pkgname}-${pkgver}::git+https://github.com/pytorch/pytorch.git#tag=v$_pkgver"
# generated using parse-submodules
"${pkgname}-ARM_NEON_2_x86_SSE::git+https://github.com/intel/ARM_NEON_2_x86_SSE.git"
"${pkgname}-FP16::git+https://github.com/Maratyszcza/FP16.git"
"${pkgname}-FXdiv::git+https://github.com/Maratyszcza/FXdiv.git"
"${pkgname}-NNPACK::git+https://github.com/Maratyszcza/NNPACK.git"
"${pkgname}-PeachPy::git+https://github.com/malfet/PeachPy.git"
"${pkgname}-QNNPACK::git+https://github.com/pytorch/QNNPACK"
"${pkgname}-VulkanMemoryAllocator::git+https://github.com/GPUOpen-LibrariesAndSDKs/VulkanMemoryAllocator.git"
"${pkgname}-XNNPACK::git+https://github.com/google/XNNPACK.git"
"${pkgname}-benchmark::git+https://github.com/google/benchmark.git"
"${pkgname}-cpuinfo::git+https://github.com/pytorch/cpuinfo.git"
"${pkgname}-cub::git+https://github.com/NVlabs/cub.git"
"${pkgname}-cudnn-frontend::git+https://github.com/NVIDIA/cudnn-frontend.git"
"${pkgname}-cutlass::git+https://github.com/NVIDIA/cutlass.git"
"${pkgname}-eigen::git+https://gitlab.com/libeigen/eigen.git"
"${pkgname}-enum34::git+https://github.com/PeachPy/enum34.git"
"${pkgname}-fbgemm::git+https://github.com/pytorch/fbgemm"
"${pkgname}-fbjni::git+https://github.com/facebookincubator/fbjni.git"
"${pkgname}-flatbuffers::git+https://github.com/google/flatbuffers.git"
"${pkgname}-fmt::git+https://github.com/fmtlib/fmt.git"
"${pkgname}-foxi::git+https://github.com/houseroad/foxi.git"
"${pkgname}-gemmlowp::git+https://github.com/google/gemmlowp.git"
"${pkgname}-gloo::git+https://github.com/facebookincubator/gloo"
"${pkgname}-googletest::git+https://github.com/google/googletest.git"
"${pkgname}-ideep::git+https://github.com/intel/ideep"
"${pkgname}-ios-cmake::git+https://github.com/Yangqing/ios-cmake.git"
"${pkgname}-ittapi::git+https://github.com/intel/ittapi.git"
"${pkgname}-json::git+https://github.com/nlohmann/json.git"
"${pkgname}-kineto::git+https://github.com/pytorch/kineto"
"${pkgname}-nccl::git+https://github.com/NVIDIA/nccl"
"${pkgname}-onnx-tensorrt::git+https://github.com/onnx/onnx-tensorrt"
"${pkgname}-onnx::git+https://github.com/onnx/onnx.git"
"${pkgname}-pocketfft::git+https://github.com/mreineck/pocketfft"
"${pkgname}-protobuf::git+https://github.com/protocolbuffers/protobuf.git"
"${pkgname}-psimd::git+https://github.com/Maratyszcza/psimd.git"
"${pkgname}-pthreadpool::git+https://github.com/Maratyszcza/pthreadpool.git"
"${pkgname}-pybind11::git+https://github.com/pybind/pybind11.git"
"${pkgname}-six::git+https://github.com/benjaminp/six.git"
"${pkgname}-sleef::git+https://github.com/shibatch/sleef"
"${pkgname}-tbb::git+https://github.com/01org/tbb"
"${pkgname}-tensorpipe::git+https://github.com/pytorch/tensorpipe.git"
"${pkgname}-zstd::git+https://github.com/facebook/zstd.git"
fix_include_system.patch
use-system-libuv.patch
fix-building-for-torchvision.patch
87773.patch
disable-werror1.patch
disable-werror2.patch
disable-werror3.patch
disable-werror4.patch
ffmpeg4.4.patch
rocblas-batched.patch)
b2sums=('SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'SKIP'
'77f85808e480bd37dfb5f072d565466ae30a8f827f49ef97591fc2fc03bea54944eb1adeaa4a1e3466518a5640f575eda88d15b4c4d549a6f41f0bf4f2cfb086'
'1f7ce593fa9fc62535ca1c3d85c996a73006cc614c7b7258160c3fc53cd52a1cfddcb18baf897f2e1223ecdfee52ca1471b91c9f845368ed6ac51b66f6e0e676'
'fdea0b815d7750a4233c1d4668593020da017aea43cf4cb63b4c00d0852c7d34f0333e618fcf98b8df2185313a2089b8c2e9fe8ec3cfb0bf693598f9c61461a8'
'0a8fc110a306e81beeb9ddfb3a1ddfd26aeda5e3f7adfb0f7c9bc3fd999c2dde62e0b407d3eca573097a53fd97329214e30e8767fb38d770197c7ec2b53daf18'
'844d0b7b39777492a6d456fa845d5399f673b4bb37b62473393449c9ad0c29dca3c33276dc3980f2e766680100335c0acfb69d51781b79575f4da112d9c4018c'
'985e331b2025e1ca5a4fba5188af0900f1f38bd0fd32c9173deb8bed7358af01e387d4654c7e0389e5f98b6f7cbed053226934d180b8b3b1270bdbbb36fc89b2'
'96de2729b29c7ce3e4fdd8008f575d24c2c3ef9f85d6217e607902d7b870ac71b9290fde71e87a68d75bb75ef28eacbf5ce04e071146809ccf1e76a03f97b479'
'eea86bbed0a37e1661035913536456f90e0cd1e687c7e4103011f0688bc8347b6fc2ff82019909c41e7c89ddbc3b80dde641e88abf406f4faebc71b0bb693d25'
'6286b05d5b5143f117363e3ce3c7d693910f53845aeb6f501b3eea64aa71778cb2d7dcd4ac945d5321ef23b4da02446e86dedc6a9b6a998df4a7f3b1ce50550a'
'232d2aca7cae8da511d1451890f8696d47da72276929ac5731a1a1a481d2a515fa7288bf33730d8ea2c892616551a74ca2439b53de6b1dfee156c30919120741')
options=('!lto' '!debug')
get_pyver () {
python -c 'import sys; print(str(sys.version_info[0]) + "." + str(sys.version_info[1]))'
}
prepare() {
cd "${srcdir}/${_pkgname}-${pkgver}"
# generated using parse-submodules
git submodule init
git config submodule."android/libs/fbjni".url "${srcdir}/${pkgname}"-fbjni
git config submodule."third_party/NNPACK".url "${srcdir}/${pkgname}"-NNPACK
git config submodule."third_party/NNPACK_deps/FP16".url "${srcdir}/${pkgname}"-FP16
git config submodule."third_party/NNPACK_deps/FXdiv".url "${srcdir}/${pkgname}"-FXdiv
git config submodule."third_party/NNPACK_deps/psimd".url "${srcdir}/${pkgname}"-psimd
git config submodule."third_party/NNPACK_deps/pthreadpool".url "${srcdir}/${pkgname}"-pthreadpool
git config submodule."third_party/QNNPACK".url "${srcdir}/${pkgname}"-QNNPACK
git config submodule."third_party/VulkanMemoryAllocator".url "${srcdir}/${pkgname}"-VulkanMemoryAllocator
git config submodule."third_party/XNNPACK".url "${srcdir}/${pkgname}"-XNNPACK
git config submodule."third_party/benchmark".url "${srcdir}/${pkgname}"-benchmark
git config submodule."third_party/cpuinfo".url "${srcdir}/${pkgname}"-cpuinfo
git config submodule."third_party/cub".url "${srcdir}/${pkgname}"-cub
git config submodule."third_party/cudnn_frontend".url "${srcdir}/${pkgname}"-cudnn-frontend
git config submodule."third_party/cutlass".url "${srcdir}/${pkgname}"-cutlass
git config submodule."third_party/eigen".url "${srcdir}/${pkgname}"-eigen
git config submodule."third_party/fbgemm".url "${srcdir}/${pkgname}"-fbgemm
git config submodule."third_party/flatbuffers".url "${srcdir}/${pkgname}"-flatbuffers
git config submodule."third_party/fmt".url "${srcdir}/${pkgname}"-fmt
git config submodule."third_party/foxi".url "${srcdir}/${pkgname}"-foxi
git config submodule."third_party/gemmlowp/gemmlowp".url "${srcdir}/${pkgname}"-gemmlowp
git config submodule."third_party/gloo".url "${srcdir}/${pkgname}"-gloo
git config submodule."third_party/googletest".url "${srcdir}/${pkgname}"-googletest
git config submodule."third_party/ideep".url "${srcdir}/${pkgname}"-ideep
git config submodule."third_party/ios-cmake".url "${srcdir}/${pkgname}"-ios-cmake
git config submodule."third_party/ittapi".url "${srcdir}/${pkgname}"-ittapi
git config submodule."third_party/kineto".url "${srcdir}/${pkgname}"-kineto
git config submodule."third_party/nccl/nccl".url "${srcdir}/${pkgname}"-nccl
git config submodule."third_party/neon2sse".url "${srcdir}/${pkgname}"-ARM_NEON_2_x86_SSE
git config submodule."third_party/nlohmann".url "${srcdir}/${pkgname}"-json
git config submodule."third_party/onnx".url "${srcdir}/${pkgname}"-onnx
git config submodule."third_party/onnx-tensorrt".url "${srcdir}/${pkgname}"-onnx-tensorrt
git config submodule."third_party/pocketfft".url "${srcdir}/${pkgname}"-pocketfft
git config submodule."third_party/protobuf".url "${srcdir}/${pkgname}"-protobuf
git config submodule."third_party/pybind11".url "${srcdir}/${pkgname}"-pybind11
git config submodule."third_party/python-enum".url "${srcdir}/${pkgname}"-enum34
git config submodule."third_party/python-peachpy".url "${srcdir}/${pkgname}"-PeachPy
git config submodule."third_party/python-six".url "${srcdir}/${pkgname}"-six
git config submodule."third_party/sleef".url "${srcdir}/${pkgname}"-sleef
git config submodule."third_party/tbb".url "${srcdir}/${pkgname}"-tbb
git config submodule."third_party/tensorpipe".url "${srcdir}/${pkgname}"-tensorpipe
git config submodule."third_party/zstd".url "${srcdir}/${pkgname}"-zstd
git -c protocol.file.allow=always submodule update --init --recursive
# Fix include with GCC 12
sed "1i#include <mutex>" -i third_party/kineto/libkineto/src/RoctracerActivityApi.h
# https://bugs.archlinux.org/task/64981
patch -N torch/utils/cpp_extension.py "${srcdir}"/fix_include_system.patch
# Use system libuv
patch -Np1 -i "${srcdir}"/use-system-libuv.patch
# fix https://github.com/pytorch/vision/issues/3695
patch -Np1 -i "${srcdir}/fix-building-for-torchvision.patch"
# Fix building against glog 0.6
patch -Np1 -i "${srcdir}/87773.patch"
# Disable -Werror
patch -Np1 -d third_party/fbgemm -i "${srcdir}/disable-werror1.patch"
patch -Np1 -d third_party/benchmark -i "${srcdir}/disable-werror2.patch"
patch -Np1 -d third_party/ideep/mkl-dnn -i "${srcdir}/disable-werror3.patch"
patch -Np1 -i "${srcdir}/disable-werror4.patch"
# build against ffmpeg4.4
patch -Np1 -i "${srcdir}/ffmpeg4.4.patch"
# fix https://github.com/pytorch/pytorch/issues/97640
patch -Np1 -i "${srcdir}/rocblas-batched.patch"
cd "${srcdir}"
cp -r "${_pkgname}-${pkgver}" "${_pkgname}-${pkgver}-opt"
cp -r "${_pkgname}-${pkgver}" "${_pkgname}-${pkgver}-cuda"
cp -r "${_pkgname}-${pkgver}" "${_pkgname}-${pkgver}-opt-cuda"
cp -r "${_pkgname}-${pkgver}" "${_pkgname}-${pkgver}-rocm"
cp -r "${_pkgname}-${pkgver}" "${_pkgname}-${pkgver}-opt-rocm"
}
# Common build configuration, called in all package() functions.
_prepare() {
export VERBOSE=1
export PYTORCH_BUILD_VERSION="${pkgver}"
export PYTORCH_BUILD_NUMBER=1
# Check tools/setup_helpers/cmake.py, setup.py and CMakeLists.txt for a list of flags that can be set via env vars.
export ATEN_NO_TEST=ON # do not build ATen tests
export USE_MKLDNN=ON
export BUILD_CUSTOM_PROTOBUF=OFF
export BUILD_CAFFE2=ON
export BUILD_CAFFE2_OPS=ON
# export BUILD_SHARED_LIBS=OFF
export USE_FFMPEG=ON
export USE_GFLAGS=ON
export USE_GLOG=ON
export USE_VULKAN=ON
export BUILD_BINARY=ON
export USE_OBSERVERS=ON
export USE_OPENCV=ON
# export USE_SYSTEM_LIBS=ON # experimental, not all libs present in repos
export USE_SYSTEM_NCCL=ON
export NCCL_VERSION=$(pkg-config nccl --modversion)
export NCCL_VER_CODE=$(sed -n 's/^#define NCCL_VERSION_CODE\s*\(.*\).*/\1/p' /usr/include/nccl.h)
# export BUILD_SPLIT_CUDA=ON # modern preferred build, but splits libs and symbols, ABI break
# export USE_FAST_NVCC=ON # parallel build with nvcc, spawns too many processes
export USE_CUPTI_SO=ON # make sure cupti.so is used as shared lib
export CC=/usr/bin/gcc-12
export CXX=/usr/bin/g++-12
export CUDAHOSTCXX=/opt/cuda/bin/g++
export CUDA_HOST_COMPILER="${CUDAHOSTCXX}"
export CUDA_HOME=/opt/cuda
# hide build-time CUDA devices
export CUDA_VISIBLE_DEVICES=""
export CUDNN_LIB_DIR=/usr/lib
export CUDNN_INCLUDE_DIR=/usr/include
export TORCH_NVCC_FLAGS="-Xfatbin -compress-all"
# CUDA arch 8.7 is not supported (needed by Jetson boards, etc.)
export TORCH_CUDA_ARCH_LIST="5.2;5.3;6.0;6.1;6.2;7.0;7.2;7.5;8.0;8.6;8.9;9.0;9.0+PTX" #include latest PTX for future compat
export OVERRIDE_TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST}"
export PYTORCH_ROCM_ARCH="gfx803;gfx900;gfx906;gfx908;gfx90a;gfx1030"
# Hack to make sure that the generated dnnl_config.h from onednn can be inlcuded.
export CXXFLAGS="${CXXFLAGS} -I third_party/ideep/mkl-dnn/third_party/oneDNN/include/"
}
#
# Important note on the missing build() function
#
# We build the pytorch packages for the different backends directly in
# corresponding package() functions. This change became necessary when
# merging the two different GPU backends (CUDA and ROCm) into one package.
# Both share a dependency on the magma package but compiled against
# different GPU backends. This leads to two incompatible magma-{cuda,hip}
# packages that cannot be installed side-by-side.
# Therefore, we need to separately add magma-{cuda,hip} as (make-) dependencies
# of pytorch-{cuda,rocm}.
_package() {
# Prevent setup.py from re-running CMake and rebuilding
sed -e 's/RUN_BUILD_DEPS = True/RUN_BUILD_DEPS = False/g' -i setup.py
python setup.py install --root="${pkgdir}"/ --optimize=1 --skip-build
install -Dm644 LICENSE "${pkgdir}/usr/share/licenses/${pkgname}/LICENSE"
pytorchpath="usr/lib/python$(get_pyver)/site-packages/torch"
install -d "${pkgdir}/usr/lib"
# put CMake files in correct place
mv "${pkgdir}/${pytorchpath}/share/cmake" "${pkgdir}/usr/lib/cmake"
# put C++ API in correct place
mv "${pkgdir}/${pytorchpath}/include" "${pkgdir}/usr/include"
find "${pkgdir}/${pytorchpath}"/lib/ -type f,l \( -iname '*.so' -or -iname '*.so*' \) -print0 | while read -rd $'\0' _lib; do
mv "${_lib}" "${pkgdir}"/usr/lib/
done
# clean up duplicates
rm -r "${pkgdir}/usr/include/pybind11"
rm "${pkgdir}"/usr/include/*.h
# Python module is hardcoded so look there at runtime
ln -s /usr/include "${pkgdir}/${pytorchpath}/include"
find "${pkgdir}"/usr/lib -maxdepth 1 -type f,l \( -iname '*.so' -or -iname '*.so*' \) -print0 | while read -rd $'\0' _lib; do
ln -s ${_lib#"$pkgdir"} "${pkgdir}/${pytorchpath}/lib/"
done
}
package_python-pytorch() {
pkgdesc="${_pkgdesc}"
cd "${srcdir}/${_pkgname}-${pkgver}"
echo "Building without cuda or rocm and without non-x86-64 optimizations"
_prepare
export USE_CUDA=0
export USE_CUDNN=0
export USE_ROCM=0
echo "add_definitions(-march=x86-64)" >> cmake/MiscCheck.cmake
# this horrible hack is necessary because the current release
# ships inconsistent CMake which tries to build objects before
# thier dependencies, build twice when dependencies are available
python setup.py build || python setup.py build
_package
}
package_python-pytorch-opt() {
pkgdesc="${_pkgdesc} (with AVX2 CPU optimizations)"
conflicts=(python-pytorch)
provides=(python-pytorch)
cd "${srcdir}/${_pkgname}-${pkgver}-opt"
echo "Building without cuda or rocm and with non-x86-64 optimizations"
_prepare
export USE_CUDA=0
export USE_CUDNN=0
export USE_ROCM=0
echo "add_definitions(-march=haswell)" >> cmake/MiscCheck.cmake
# same horrible hack as above
python setup.py build || python setup.py build
_package
}
package_python-pytorch-cuda() {
pkgdesc="${_pkgdesc} (with CUDA)"
depends+=(cuda cudnn magma-cuda)
conflicts=(python-pytorch)
provides=(python-pytorch)
cd "${srcdir}/${_pkgname}-${pkgver}-cuda"
echo "Building with cuda and without non-x86-64 optimizations"
_prepare
export USE_CUDA=1
export USE_CUDNN=1
export USE_ROCM=0
cd "${srcdir}/${_pkgname}-${pkgver}-cuda"
echo "add_definitions(-march=x86-64)" >> cmake/MiscCheck.cmake
# same horrible hack as above
python setup.py build || python setup.py build
_package
# oneDNN from the repos conflicts with the version in the ideep submodule,
# so we have to add the dependency after building the package.
depends+=(onednn)
}
package_python-pytorch-opt-cuda() {
pkgdesc="${_pkgdesc} (with CUDA and AVX2 CPU optimizations)"
depends+=(cuda cudnn magma-cuda)
conflicts=(python-pytorch)
provides=(python-pytorch python-pytorch-cuda)
cd "${srcdir}/${_pkgname}-${pkgver}-opt-cuda"
echo "Building with cuda and with non-x86-64 optimizations"
export USE_CUDA=1
export USE_CUDNN=1
export USE_ROCM=0
_prepare
echo "add_definitions(-march=haswell)" >> cmake/MiscCheck.cmake
# same horrible hack as above
python setup.py build || python setup.py build
_package
# see above
depends+=(onednn)
}
package_python-pytorch-rocm() {
pkgdesc="${_pkgdesc} (with ROCm)"
depends+=(rocm-hip-sdk roctracer miopen magma-hip)
conflicts=(python-pytorch)
provides=(python-pytorch)
cd "${srcdir}/${_pkgname}-${pkgver}-rocm"
echo "Building with rocm and without non-x86-64 optimizations"
_prepare
export USE_CUDA=0
export USE_CUDNN=0
export USE_ROCM=1
echo "add_definitions(-march=x86-64)" >> cmake/MiscCheck.cmake
# Conversion of CUDA to ROCm source files
python tools/amd_build/build_amd.py
# same horrible hack as above
python setup.py build || python setup.py build
_package
# see above
depends+=(onednn)
}
package_python-pytorch-opt-rocm() {
pkgdesc="${_pkgdesc} (with ROCm and AVX2 CPU optimizations)"
depends+=(rocm-hip-sdk roctracer miopen magma-hip)
conflicts=(python-pytorch)
provides=(python-pytorch python-pytorch-rocm)
cd "${srcdir}/${_pkgname}-${pkgver}-opt-rocm"
echo "Building with rocm and with non-x86-64 optimizations"
_prepare
export USE_CUDA=0
export USE_CUDNN=0
export USE_ROCM=1
echo "add_definitions(-march=haswell)" >> cmake/MiscCheck.cmake
# Conversion of CUDA to ROCm source files
python tools/amd_build/build_amd.py
# same horrible hack as above
python setup.py build || python setup.py build
_package
# see above
depends+=(onednn)
}
# vim:set ts=2 sw=2 et: