Skip to content

Commit 9e764b5

Browse files
authored
Merge pull request #23 from howetuft/work
Work
2 parents 5623593 + 2765552 commit 9e764b5

File tree

10 files changed

+86
-11
lines changed

10 files changed

+86
-11
lines changed

.github/workflows/wheels.yml

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,8 @@ jobs:
2828
#os: [ubuntu-latest]
2929
#python-minor: [ 11]
3030
#os: [windows-latest]
31+
#python-minor: [ 11]
32+
#os: [macos-13]
3133
exclude:
3234
- os: macos-14
3335
python-minor: 8
@@ -93,6 +95,13 @@ jobs:
9395
core.exportVariable('CCACHE_DEBUGDIR', String.raw`${{ github.workspace }}/ccache-debug`);
9496
core.exportVariable('CCACHE_LOGFILE', String.raw`${{ github.workspace }}/ccache.log`);
9597
98+
99+
- name: Update apt (Linux)
100+
if: runner.os == 'Linux'
101+
shell: bash
102+
run: |
103+
sudo apt-get update -y
104+
96105
- name: ccache
97106
uses: hendrikmuhs/[email protected]
98107
with:
@@ -219,9 +228,10 @@ jobs:
219228
CIBW_REPAIR_WHEEL_COMMAND_LINUX: |
220229
TBB=/project/full_deploy/host/onetbb/$TBB_VERSION/Release/x86_64/lib
221230
OIDN=/project/full_deploy/host/oidn/$OIDN_VERSION/Release/x86_64/lib
231+
EMBREE3=/project/full_deploy/host/embree3/$EMBREE3_VERSION/Release/x86_64/lib
222232
HWLOC=/project/full_deploy/host/hwloc/2.9.3/Release/x86_64/lib
223233
LEVEL_ZERO=/project/full_deploy/host/level-zero/1.17.39/Release/x86_64/lib
224-
LD_LIBRARY_PATH=$TBB:$HWLOC:$LEVEL_ZERO:$OIDN:$LD_LIBRARY_PATH
234+
LD_LIBRARY_PATH=$TBB:$HWLOC:$LEVEL_ZERO:$OIDN:$EMBREE3:$LD_LIBRARY_PATH
225235
echo "LD_LIBRARY_PATH=${LD_LIBRARY_PATH}"
226236
export LD_LIBRARY_PATH
227237

.gitignore

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,12 @@ __pycache__/
66
# C extensions
77
*.so
88

9+
# ccache
10+
.ccache/
11+
12+
# conan-cache content
13+
conan-cache/*
14+
915
# Distribution / packaging
1016
.Python
1117
build/

conan-profiles/conan-profile-Linux-X64

Lines changed: 6 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -8,9 +8,12 @@ compiler.version=12
88
compiler.cppstd={{ os.getenv("CXX_VERSION") }}
99
compiler.libcxx=libstdc++11
1010

11-
[conf]
12-
openvdb/*:tools.cmake.cmaketoolchain:extra_variables={ 'USE_CCACHE':'OFF' }
13-
1411
[options]
1512
openvdb/*:simd=AVX
13+
embree3/*:avx2=True
1614
embree3/*:avx512=True
15+
16+
[conf]
17+
tools.build:cflags+=["-ftree-vectorize", "-march=x86-64-v3", "-O3"]
18+
tools.build:cxxflags+=["-ftree-vectorize", "-march=x86-64-v3", "-O3"]
19+
openvdb/*:tools.cmake.cmaketoolchain:extra_variables={ 'USE_CCACHE':'OFF' }

conan-profiles/conan-profile-Windows-X64

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,8 +10,9 @@ compiler.runtime=dynamic
1010

1111
[conf]
1212
tools.env.virtualenv:powershell=False
13-
tools.build:cxxflags=["/openmp", "/MP", "/DEBUG:NONE"]
13+
tools.build:cxxflags=["/openmp", "/MP", "/DEBUG:NONE", "/O2", "/arch:AVX"]
14+
embree3/*:tools.build:cxxflags=["/openmp", "/MP", "/DEBUG:NONE", "/O2"]
1415

1516
[options]
1617
openvdb/*:simd=AVX
17-
embree3/*:avx=True
18+
# NB: MSVC does not support avx2 nor avx512

conan-profiles/conan-profile-common

Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,3 +16,45 @@ yasm/*
1616

1717
[options]
1818
oidn/*:shared=True
19+
embree3/*:shared=True
20+
embree3/*:with_tbb=True
21+
embree3/*:sse2=True
22+
embree3/*:sse42=True
23+
embree3/*:avx=True
24+
25+
26+
# boost/*:without_atomic=True
27+
boost/*:without_charconv=True
28+
# boost/*:without_chrono=True
29+
boost/*:without_cobalt=True
30+
# boost/*:without_container=True
31+
boost/*:without_context=True
32+
boost/*:without_contract=True
33+
boost/*:without_coroutine=True
34+
# boost/*:without_date_time=True
35+
# boost/*:without_exception=True
36+
boost/*:without_fiber=True
37+
# boost/*:without_filesystem=True
38+
# boost/*:without_graph=True
39+
boost/*:without_graph_parallel=True
40+
# boost/*:without_iostreams=True
41+
boost/*:without_json=True
42+
boost/*:without_locale=True
43+
boost/*:without_log=True
44+
# boost/*:without_math=True
45+
boost/*:without_mpi=True
46+
boost/*:without_nowide=True
47+
boost/*:without_process=True
48+
# boost/*:without_program_options=True
49+
boost/*:without_python=True
50+
# boost/*:without_random=True
51+
# boost/*:without_regex=True
52+
# boost/*:without_serialization=True
53+
boost/*:without_stacktrace=True
54+
# boost/*:without_system=True
55+
boost/*:without_test=True
56+
# boost/*:without_thread=True
57+
boost/*:without_timer=True
58+
boost/*:without_type_erasure=True
59+
boost/*:without_url=True
60+
boost/*:without_wave=True

conan-profiles/conan-profile-macOS-ARM64

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -30,10 +30,15 @@ compiler.libcxx=libc++
3030
[options]
3131
minizip-ng/*:with_zlib=True
3232
minizip-ng/*:with_libcomp=False
33+
embree3/*:sse2=False
34+
embree3/*:sse42=False
35+
embree3/*:avx=False
36+
embree3/*:avx2=False
3337
embree3/*:neon2x=True
3438

3539
{% endif %}
3640

3741
[buildenv]
3842
CXX=clang++
3943
CC=clang
44+
&:tools.build:cxxflags=["-O3"]

conan-profiles/conan-profile-macOS-X64

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -13,9 +13,11 @@ compiler.libcxx=libc++
1313
minizip-ng/*:with_zlib=True
1414
minizip-ng/*:with_libcomp=False
1515
openvdb/*:simd=AVX
16-
embree3/*:avx512=True
17-
embree3/*:shared=True
1816

1917
[buildenv]
2018
CXX=clang++
2119
CC=clang
20+
21+
[conf]
22+
&:tools.build:cxxflags+=["-ftree-vectorize", "-march=x86-64-v3", "-O3", "-mno-avx2"]
23+
# NB: Github MacOS X64 runner does not support avx2 nor avx512

doc/notes.md

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -91,7 +91,12 @@ author).
9191
tried to have it minimal and it's 10.13. For the delocation to succeed, we also
9292
have to set `MACOSX_DEPLOYMENT_TARGET` environment variable to 10.13.
9393

94+
## Vectorization
95+
For Intel, we stick to x86-64-v3 (Haswell, 2013), no more. For all platform
96+
except MacOS Intel, we rely on "-O" option.
97+
For MacOS Intel: Github runner is not standard, we have to deactivate avx2
98+
extensions. Otherwise `pyluxcore.so` cannot be tested ("Illegal instruction").
99+
See https://github.com/ggerganov/whisper.cpp/issues/358 and `sysctl -a
100+
machdep.cpu`
94101

95102

96-
we
97-

pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ build-backend = "scikit_build_core.build"
88

99
[project]
1010
name = "pyluxcore"
11-
version = "2.9a1.post12"
11+
version = "2.9a1.post13"
1212
dependencies = [
1313
"numpy >= 2; python_version > '3.8'",
1414
"numpy < 2; python_version <= '3.8'",

scripts/repair_wheel_windows.sh

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@ delvewheel repair -v \
2727
--add-path="${redist_paths}" \
2828
--add-path="C:/Users/runneradmin/full_deploy/host/onetbb/${TBB_VERSION}/Release/x86_64/bin" \
2929
--add-path="C:/Users/runneradmin/full_deploy/host/oidn/${OIDN_VERSION}/Release/x86_64/bin" \
30+
--add-path="C:/Users/runneradmin/full_deploy/host/embree3/${EMBREE3_VERSION}/Release/x86_64/bin" \
3031
-w "${dest_dir}" \
3132
"${wheel}"
3233

0 commit comments

Comments
 (0)