Skip to content

Commit 1bdf83c

Browse files
praveenkk123 (Praveen Kundurthy) and Praveen Kundurthy authored
Changed the required sub-group size from 8 to 32 (#1406)
Co-authored-by: Praveen Kundurthy <[email protected]>
1 parent 6fc3284 commit 1bdf83c

File tree

3 files changed: +6 -6 lines changed

DirectProgramming/C++SYCL/Jupyter/oneapi-essentials-training/04_SYCL_Sub_Groups/Sub_Groups.ipynb

+4-4
Original file line numberDiff line numberDiff line change
@@ -357,7 +357,7 @@
357357
" auto out = stream(1024, 768, h);\n",
358358
"\n",
359359
" //# nd-range kernel with user specified sub_group size\n",
360-
" h.parallel_for(nd_range<1>(N, B), [=](nd_item<1> item)[[intel::reqd_sub_group_size(8)]] {\n",
360+
" h.parallel_for(nd_range<1>(N, B), [=](nd_item<1> item)[[intel::reqd_sub_group_size(32)]] {\n",
361361
" //# get sub_group handle\n",
362362
" auto sg = item.get_sub_group();\n",
363363
"\n",
@@ -783,7 +783,7 @@
783783
" for(int i=0; i<N; i++) std::cout << input[i] << \" \"; std::cout << \"\\n\"; \n",
784784
"\n",
785785
" //# use parallel_for and sub_groups\n",
786-
" q.parallel_for(nd_range<1>(N, B), [=](nd_item<1> item)[[intel::reqd_sub_group_size(8)]] {\n",
786+
" q.parallel_for(nd_range<1>(N, B), [=](nd_item<1> item)[[intel::reqd_sub_group_size(32)]] {\n",
787787
" auto sg = item.get_sub_group();\n",
788788
" auto i = item.get_global_id(0);\n",
789789
"\n",
@@ -976,7 +976,7 @@
976976
],
977977
"metadata": {
978978
"kernelspec": {
979-
"display_name": "Python 3.7 (Intel® oneAPI)",
979+
"display_name": "Python 3 (Intel® oneAPI 2023.0)",
980980
"language": "python",
981981
"name": "c009-intel_distribution_of_python_3_oneapi-beta05-python"
982982
},
@@ -990,7 +990,7 @@
990990
"name": "python",
991991
"nbconvert_exporter": "python",
992992
"pygments_lexer": "ipython3",
993-
"version": "3.9.7"
993+
"version": "3.9.15"
994994
},
995995
"toc": {
996996
"base_numbering": 1,

DirectProgramming/C++SYCL/Jupyter/oneapi-essentials-training/04_SYCL_Sub_Groups/lab/sub_group_reqd_size.cpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@ int main() {
2727
auto out = stream(1024, 768, h);
2828

2929
//# nd-range kernel with user specified sub_group size
30-
h.parallel_for(nd_range<1>(N, B), [=](nd_item<1> item)[[intel::reqd_sub_group_size(8)]] {
30+
h.parallel_for(nd_range<1>(N, B), [=](nd_item<1> item)[[intel::reqd_sub_group_size(32)]] {
3131
//# get sub_group handle
3232
auto sg = item.get_sub_group();
3333

DirectProgramming/C++SYCL/Jupyter/oneapi-essentials-training/04_SYCL_Sub_Groups/lab/sub_group_votes.cpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@ int main() {
2525
for(int i=0; i<N; i++) std::cout << input[i] << " "; std::cout << "\n";
2626

2727
//# use parallel_for and sub_groups
28-
q.parallel_for(nd_range<1>(N, B), [=](nd_item<1> item)[[intel::reqd_sub_group_size(8)]] {
28+
q.parallel_for(nd_range<1>(N, B), [=](nd_item<1> item)[[intel::reqd_sub_group_size(32)]] {
2929
auto sg = item.get_sub_group();
3030
auto i = item.get_global_id(0);
3131

0 commit comments

Comments
 (0)