42 lines
2.1 KiB
Bash
42 lines
2.1 KiB
Bash
|
|
#! /bin/bash
|
||
|
|
|
||
|
|
set -e
|
||
|
|
set -x
|
||
|
|
|
||
|
|
CUDA_ROOT="C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v11.2"
|
||
|
|
curl -L -nv -o cuda.exe https://developer.download.nvidia.com/compute/cuda/11.2.2/local_installers/cuda_11.2.2_461.33_win10.exe
|
||
|
|
./cuda.exe -s nvcc_11.2 cudart_11.2 cublas_dev_11.2 curand_dev_11.2
|
||
|
|
rm cuda.exe
|
||
|
|
|
||
|
|
curl -L -nv -o cudnn.zip https://developer.download.nvidia.com/compute/redist/cudnn/v8.1.1/cudnn-11.2-windows-x64-v8.1.1.33.zip
|
||
|
|
unzip cudnn.zip && rm cudnn.zip
|
||
|
|
cp -r cuda/* "$CUDA_ROOT"
|
||
|
|
rm -r cuda/
|
||
|
|
|
||
|
|
# See https://github.com/oneapi-src/oneapi-ci for installer URLs
|
||
|
|
curl -L -nv -o webimage.exe https://registrationcenter-download.intel.com/akdlm/irc_nas/19078/w_BaseKit_p_2023.0.0.25940_offline.exe
|
||
|
|
./webimage.exe -s -x -f webimage_extracted --log extract.log
|
||
|
|
rm webimage.exe
|
||
|
|
./webimage_extracted/bootstrapper.exe -s --action install --components="intel.oneapi.win.mkl.devel" --eula=accept -p=NEED_VS2017_INTEGRATION=0 -p=NEED_VS2019_INTEGRATION=0 --log-dir=.
|
||
|
|
|
||
|
|
ONEDNN_VERSION=3.0.1
|
||
|
|
curl -L -O https://github.com/oneapi-src/oneDNN/archive/refs/tags/v${ONEDNN_VERSION}.tar.gz
|
||
|
|
tar xf *.tar.gz && rm *.tar.gz
|
||
|
|
cd oneDNN-*
|
||
|
|
cmake -DCMAKE_BUILD_TYPE=Release -DDNNL_LIBRARY_TYPE=STATIC -DDNNL_BUILD_EXAMPLES=OFF -DDNNL_BUILD_TESTS=OFF -DDNNL_ENABLE_WORKLOAD=INFERENCE -DDNNL_ENABLE_PRIMITIVE="CONVOLUTION;REORDER" .
|
||
|
|
cmake --build . --config Release --target install --parallel 2
|
||
|
|
cd ..
|
||
|
|
rm -r oneDNN-*
|
||
|
|
|
||
|
|
mkdir build
|
||
|
|
cd build
|
||
|
|
cmake -DCMAKE_BUILD_TYPE=Release -DCMAKE_INSTALL_PREFIX=$CTRANSLATE2_ROOT -DCMAKE_PREFIX_PATH="C:/Program Files (x86)/Intel/oneAPI/compiler/latest/windows/compiler/lib/intel64_win;C:/Program Files (x86)/oneDNN" -DBUILD_CLI=OFF -DWITH_DNNL=ON -DWITH_CUDA=ON -DWITH_CUDNN=ON -DCUDA_TOOLKIT_ROOT_DIR="$CUDA_ROOT" -DCUDA_DYNAMIC_LOADING=ON -DCUDA_NVCC_FLAGS="-Xfatbin=-compress-all" -DCUDA_ARCH_LIST="Common" ..
|
||
|
|
cmake --build . --config Release --target install --parallel 2 --verbose
|
||
|
|
cd ..
|
||
|
|
rm -r build
|
||
|
|
|
||
|
|
cp README.md python/
|
||
|
|
cp $CTRANSLATE2_ROOT/bin/ctranslate2.dll python/ctranslate2/
|
||
|
|
cp "C:/Program Files (x86)/Intel/oneAPI/compiler/latest/windows/redist/intel64_win/compiler/libiomp5md.dll" python/ctranslate2/
|
||
|
|
cp "$CUDA_ROOT/bin/cudnn64_8.dll" python/ctranslate2/
|