Skip to content

Commit 2dee5b8

Browse files
Merge branch 'main' into new-delete-aarch64
2 parents db521d4 + 08c724b commit 2dee5b8

File tree

246 files changed

+12412
-3444
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

246 files changed

+12412
-3444
lines changed

.github/CODEOWNERS

+12-8
Original file line numberDiff line numberDiff line change
@@ -17,17 +17,9 @@
1717
# Default
1818
* @oneapi-src/onednn-arch @intel-innersource/dnn-arch
1919

20-
# Codeowners
21-
/.github/CODEOWNERS @oneapi-src/onednn-maintain
22-
/MAINTAINERS.md @oneapi-src/onednn-maintain
23-
2420
# Github automation
2521
/.github/ @oneapi-src/onednn-devops
2622

27-
# Documentation
28-
*.md @oneapi-src/onednn-doc @oneapi-src/onednn-arch @intel-innersource/dnn-doc @intel-innersource/dnn-arch
29-
/doc/ @oneapi-src/onednn-doc @oneapi-src/onednn-arch @intel-innersource/dnn-doc @intel-innersource/dnn-arch
30-
3123
# CPU Engine
3224
/src/cpu/aarch64/ @oneapi-src/onednn-cpu-aarch64 @intel-innersource/dnn-arch
3325
/src/cpu/x64/ @oneapi-src/onednn-cpu-x64 @intel-innersource/dnn-cpu
@@ -52,3 +44,15 @@
5244
# Graph compiler
5345
/src/graph/backend/graph_compiler/ @intel-innersource/dnn-compiler
5446
/tests/gtests/graph/unit/backend/graph_compiler/ @intel-innersource/dnn-compiler
47+
48+
# Documentation
49+
*.md @oneapi-src/onednn-doc @oneapi-src/onednn-arch @intel-innersource/dnn-doc @intel-innersource/dnn-arch
50+
/doc/ @oneapi-src/onednn-doc @oneapi-src/onednn-arch @intel-innersource/dnn-doc @intel-innersource/dnn-arch
51+
52+
# Governance and process
53+
/.github/CODEOWNERS @oneapi-src/onednn-maintain
54+
/SECURITY.md @oneapi-src/onednn-maintain
55+
/MAINTAINERS.md @oneapi-src/onednn-maintain
56+
/CONTRIBUTING.md @oneapi-src/onednn-maintain
57+
/CODING_STANDARDS.md @oneapi-src/onednn-maintain
58+
/CODE_OF_CONDUCT.md @oneapi-src/onednn-maintain

.github/dependabot.yml

+1
Original file line numberDiff line numberDiff line change
@@ -20,5 +20,6 @@ updates:
2020
directory: "/"
2121
schedule:
2222
interval: "weekly"
23+
labels: [ "devops" ]
2324
commit-message:
2425
prefix: "github: workflows"

.github/labels.yml

+85
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,85 @@
1+
#===============================================================================
2+
# Copyright 2024 Intel Corporation
3+
#
4+
# Licensed under the Apache License, Version 2.0 (the "License");
5+
# you may not use this file except in compliance with the License.
6+
# You may obtain a copy of the License at
7+
#
8+
# http://www.apache.org/licenses/LICENSE-2.0
9+
#
10+
# Unless required by applicable law or agreed to in writing, software
11+
# distributed under the License is distributed on an "AS IS" BASIS,
12+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
# See the License for the specific language governing permissions and
14+
# limitations under the License.
15+
#===============================================================================
16+
17+
# This is configuration file for Labeler workflow. See documenation for syntax
18+
# reference: https://github.com/marketplace/actions/labeler
19+
20+
# Labels based on area of responsibility
21+
# Process definition and code owners
22+
governance:
23+
- changed-files:
24+
- any-glob-to-any-file:
25+
- '.github/CODEOWNERS'
26+
- 'SECURITY.md'
27+
- 'MAINTAINERS.md'
28+
- 'CONTRIBUTING.md'
29+
- 'CODING_STANDARDS.md'
30+
- 'CODE_OF_CONDUCT.md'
31+
32+
# Github automation
33+
devops:
34+
- all:
35+
- changed-files:
36+
- any-glob-to-any-file: '.github/**'
37+
- all-globs-to-all-files: '!.github/CODEOWNERS'
38+
39+
# Documentation
40+
documentation:
41+
- changed-files:
42+
- any-glob-to-any-file: ['**/*.md', 'doc/**']
43+
44+
# CPU Engine
45+
platform:cpu-aarch64:
46+
- changed-files:
47+
- any-glob-to-any-file: 'src/cpu/aarch64/**'
48+
49+
platform:cpu-ppc64:
50+
- changed-files:
51+
- any-glob-to-any-file: 'src/cpu/ppc64/**'
52+
53+
platform:cpu-rv64:
54+
- changed-files:
55+
- any-glob-to-any-file: 'src/cpu/rv64/**'
56+
57+
platform:cpu-s390x:
58+
- changed-files:
59+
- any-glob-to-any-file: 'src/cpu/s390x/**'
60+
61+
platform:cpu-x64:
62+
- changed-files:
63+
- any-glob-to-any-file: ['src/cpu/x64/**', 'src/cpu/rnn/**']
64+
65+
# GPU Engine
66+
platform:gpu-amd:
67+
- changed-files:
68+
- any-glob-to-any-file: 'src/gpu/amd/**'
69+
70+
platform:gpu-intel:
71+
- changed-files:
72+
- any-glob-to-any-file: 'src/gpu/intel/**'
73+
74+
platform:gpu-nvidia:
75+
- changed-files:
76+
- any-glob-to-any-file: 'src/gpu/nvidia/**'
77+
78+
platform:gpu-generic:
79+
- changed-files:
80+
- any-glob-to-any-file: 'src/gpu/generic/**'
81+
82+
# Labels based on target branch
83+
# Backport
84+
backport:
85+
- base-branch: 'rls-*'

.github/workflows/labeler.yml

+34
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
1+
#===============================================================================
2+
# Copyright 2024 Intel Corporation
3+
#
4+
# Licensed under the Apache License, Version 2.0 (the "License");
5+
# you may not use this file except in compliance with the License.
6+
# You may obtain a copy of the License at
7+
#
8+
# http://www.apache.org/licenses/LICENSE-2.0
9+
#
10+
# Unless required by applicable law or agreed to in writing, software
11+
# distributed under the License is distributed on an "AS IS" BASIS,
12+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
# See the License for the specific language governing permissions and
14+
# limitations under the License.
15+
#===============================================================================
16+
17+
name: Labeler
18+
on: [pull_request_target]
19+
20+
# Declare default permissions as read only.
21+
permissions: read-all
22+
23+
jobs:
24+
label:
25+
runs-on: ubuntu-latest
26+
permissions:
27+
contents: read
28+
pull-requests: write
29+
30+
steps:
31+
- uses: actions/labeler@v5.0.0
32+
with:
33+
sync-labels: true
34+
configuration-path: '.github/labels.yml'

README.binary.in

+7-4
Original file line numberDiff line numberDiff line change
@@ -39,8 +39,9 @@ The library is optimized for the following CPUs:
3939
* Intel Xeon Scalable processor (formerly Skylake, Cascade Lake, Cooper
4040
Lake, Ice Lake, Sapphire Rapids, and Emerald Rapids)
4141
* Intel Xeon CPU Max Series (formerly Sapphire Rapids HBM)
42-
* future Intel Xeon Scalable processors (code name Sierra Forest
43-
and Granite Rapids)
42+
* Intel Core Ultra processors (formerly Meteor Lake, Arrow Lake,
43+
and Lunar Lake)
44+
* Intel Xeon 6 processors (formerly Sierra Forest and Granite Rapids)
4445

4546
oneDNN detects the instruction set architecture (ISA) at runtime and uses
4647
just-in-time (JIT) code generation to deploy the code optimized
@@ -52,11 +53,13 @@ for more details.
5253

5354
The library is optimized for the following GPUs:
5455
* Intel Graphics for 11th-14th Generation Intel Core Processors
55-
* Intel Graphics for Intel Core Ultra Processors (formerly Meteor Lake)
5656
* Intel Iris Xe MAX Graphics (formerly DG1)
57-
* Intel Arc(TM) Graphics (formerly Alchemist)
57+
* Intel Arc(TM) graphics (formerly Alchemist)
5858
* Intel Data Center GPU Flex Series (formerly Arctic Sound)
5959
* Intel Data Center GPU Max Series (formerly Ponte Vecchio)
60+
* Intel Graphics and Intel Arc graphics for Intel Core Ultra processors
61+
(formerly Meteor Lake, Arrow Lake and Lunar Lake)
62+
* future Intel Arc graphics (code name Battlemage)
6063

6164
Support
6265
-------

README.md

+17-7
Original file line numberDiff line numberDiff line change
@@ -84,14 +84,14 @@ The library is optimized for the following CPUs:
8484
* Intel 64/AMD64 architecture
8585
* Intel Atom(R) processor (at least Intel SSE4.1 support is required)
8686
* Intel Core(TM) processor (at least Intel SSE4.1 support is required)
87-
* Intel Core Ultra processors (formerly Meteor Lake)
8887
* Intel Xeon(R) processor E3, E5, and E7 family (formerly Sandy Bridge,
8988
Ivy Bridge, Haswell, and Broadwell)
9089
* Intel Xeon Scalable processor (formerly Skylake, Cascade Lake, Cooper
9190
Lake, Ice Lake, Sapphire Rapids, and Emerald Rapids)
9291
* Intel Xeon CPU Max Series (formerly Sapphire Rapids HBM)
93-
* future Intel Xeon Scalable processors (code name Sierra Forest
94-
and Granite Rapids)
92+
* Intel Core Ultra processors (formerly Meteor Lake, Arrow Lake,
93+
and Lunar Lake)
94+
* Intel Xeon 6 processors (formerly Sierra Forest and Granite Rapids)
9595
* AArch64 architecture
9696
* Arm Neoverse(TM) N1 and V1 processors
9797

@@ -111,11 +111,13 @@ require the use of run-time controls to enable them. See
111111
112112
The library is optimized for the following GPUs:
113113
* Intel Graphics for 11th-14th Generation Intel Core Processors
114-
* Intel Graphics for Intel Core Ultra processors (formerly Meteor Lake)
115114
* Intel Iris Xe MAX Graphics (formerly DG1)
116115
* Intel Arc(TM) graphics (formerly Alchemist)
117116
* Intel Data Center GPU Flex Series (formerly Arctic Sound)
118117
* Intel Data Center GPU Max Series (formerly Ponte Vecchio)
118+
* Intel Graphics and Intel Arc graphics for Intel Core Ultra processors
119+
(formerly Meteor Lake, Arrow Lake and Lunar Lake)
120+
* future Intel Arc graphics (code name Battlemage)
119121

120122
[CPU dispatcher control]: https://oneapi-src.github.io/oneDNN/dev_guide_cpu_dispatcher_control.html
121123
[Linking Guide]: https://oneapi-src.github.io/oneDNN/dev_guide_link.html
@@ -171,7 +173,7 @@ On a CPU based on Arm AArch64 architecture, oneDNN CPU engine can be built with
171173
machine learning applications and provides AArch64 optimized implementations
172174
of core functions. This functionality currently requires that ACL is downloaded
173175
and built separately. See [Build from Source] section of the Developer Guide for
174-
details. oneDNN only supports Compute Library versions 24.07 or later.
176+
details. oneDNN only supports Compute Library versions 24.08 or later.
175177

176178
[Arm Compute Library (ACL)]: https://github.com/arm-software/ComputeLibrary
177179

@@ -201,6 +203,9 @@ is enabled:
201203
version of MIOpen)
202204
* [rocBLAS] version 2.45.0 or later (optional if AMD ROCm includes
203205
the required version of rocBLAS)
206+
* SYCL runtime with a generic GPU support requires
207+
* oneAPI DPC++/C++ Compiler that supports the target GPU. Refer to the
208+
[generic GPU vendor readme](src/gpu/generic/sycl/README.md) for more information.
204209

205210
> **WARNING**
206211
>
@@ -374,9 +379,12 @@ discussions.
374379

375380
# Contributing
376381

377-
We welcome community contributions to oneDNN. If you have an idea on how
378-
to improve the library:
382+
We welcome community contributions to oneDNN. You can find the oneDNN release
383+
schedule and work already in progress towards future milestones in Github's
384+
[Milestones] section. If you are looking for a specific task to start,
385+
consider selecting from issues that are marked with the [help wanted] label.
379386

387+
If you have an idea on how to improve the library:
380388
* For changes impacting the public API or library overall, such as adding new
381389
primitives or changes to the architecture, submit an [RFC pull request].
382390
* Ensure that the changes are consistent with the [code contribution guidelines]
@@ -397,6 +405,8 @@ contributors are expected to adhere to the
397405
[code contribution guidelines]: CONTRIBUTING.md#code-contribution-guidelines
398406
[coding standards]: CONTRIBUTING.md#coding-standards
399407
[pull request]: https://github.com/oneapi-src/oneDNN/pulls
408+
[Milestones]: https://github.com/oneapi-src/oneDNN/milestones
409+
[help wanted]: https://github.com/oneapi-src/oneDNN/issues?q=is%3Aissue+is%3Aopen+label%3A%22help+wanted%22
400410

401411
# License
402412

cmake/ACL.cmake

+1-1
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,7 @@ endif()
3131

3232
find_package(ACL REQUIRED)
3333

34-
set(ACL_MINIMUM_VERSION "24.07")
34+
set(ACL_MINIMUM_VERSION "24.08")
3535

3636
if(ACL_FOUND)
3737
file(GLOB_RECURSE ACL_VERSION_FILE ${ACL_INCLUDE_DIR}/*/arm_compute_version.embed)

cmake/SYCL.cmake

+12-3
Original file line numberDiff line numberDiff line change
@@ -74,16 +74,19 @@ macro(adjust_headers_priority targets)
7474
endif()
7575
endmacro()
7676

77-
if(DNNL_SYCL_CUDA)
77+
macro(suppress_warnings_for_nvidia_target)
7878
# XXX: Suppress warning coming from SYCL headers:
7979
# error: use of function template name with no prior declaration in
8080
# function call with eplicit template arguments is a C++20 extension
81-
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-c++20-extensions")
81+
append(CMAKE_CXX_FLAGS "-Wno-c++20-extensions")
8282

8383
# Suppress LLVM warning about not supporting latest cuda. It's safe enough
8484
# as long as no new cuda features are used in SYCL kernels.
85-
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-unknown-cuda-version")
85+
append(CMAKE_CXX_FLAGS "-Wno-unknown-cuda-version")
86+
endmacro()
8687

88+
if(DNNL_SYCL_CUDA)
89+
suppress_warnings_for_nvidia_target()
8790
find_package(cuBLAS REQUIRED)
8891
find_package(cuDNN REQUIRED)
8992

@@ -102,6 +105,12 @@ elseif(DNNL_SYCL_HIP)
102105

103106
list(APPEND EXTRA_SHARED_LIBS HIP::HIP rocBLAS::rocBLAS MIOpen::MIOpen)
104107
message(STATUS "DPC++ support is enabled (HIP)")
108+
elseif(DNNL_SYCL_GENERIC)
109+
CHECK_CXX_COMPILER_FLAG("-fsycl -fsycl-targets=nvptx64-nvidia-cuda" NVIDIA_TARGET_SUPPORTED)
110+
111+
if(NVIDIA_TARGET_SUPPORTED)
112+
suppress_warnings_for_nvidia_target()
113+
endif()
105114
else()
106115
find_library(OPENCL_LIBRARY OpenCL PATHS ENV LIBRARY_PATH ENV LIB NO_DEFAULT_PATH)
107116
if(OPENCL_LIBRARY)

cmake/options.cmake

+5-1
Original file line numberDiff line numberDiff line change
@@ -298,7 +298,7 @@ if(NOT DNNL_GPU_RUNTIME STREQUAL "NONE" AND DNNL_GPU_VENDOR STREQUAL "NONE")
298298
set(DNNL_GPU_VENDOR "INTEL")
299299
endif()
300300

301-
if(NOT "${DNNL_GPU_VENDOR}" MATCHES "^(NONE|INTEL|NVIDIA|AMD)$")
301+
if(NOT "${DNNL_GPU_VENDOR}" MATCHES "^(NONE|INTEL|NVIDIA|AMD|GENERIC)$")
302302
message(FATAL_ERROR "Unsupported GPU vendor: ${DNNL_GPU_VENDOR}")
303303
endif()
304304

@@ -322,12 +322,16 @@ if(DNNL_GPU_RUNTIME STREQUAL "DPCPP" OR DNNL_GPU_RUNTIME STREQUAL "SYCL")
322322
set(DNNL_GPU_SYCL true)
323323
set(DNNL_SYCL_CUDA OFF)
324324
set(DNNL_SYCL_HIP OFF)
325+
set(DNNL_SYCL_GENERIC OFF)
325326
if(DNNL_GPU_VENDOR STREQUAL "NVIDIA")
326327
set(DNNL_SYCL_CUDA ON)
327328
endif()
328329
if(DNNL_GPU_VENDOR STREQUAL "AMD")
329330
set(DNNL_SYCL_HIP ON)
330331
endif()
332+
if(DNNL_GPU_VENDOR STREQUAL "GENERIC")
333+
set(DNNL_SYCL_GENERIC ON)
334+
endif()
331335
else()
332336
set(DNNL_GPU_SYCL false)
333337
endif()

0 commit comments

Comments
 (0)