diff options
Diffstat (limited to 'dynamic-layers/clang-layer/recipes-devtools/clang')
13 files changed, 0 insertions, 18202 deletions
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/0001-Fix-debug-info-of-work-item-builtin-translation-745.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/0001-Fix-debug-info-of-work-item-builtin-translation-745.patch deleted file mode 100644 index 923b871f..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/0001-Fix-debug-info-of-work-item-builtin-translation-745.patch +++ /dev/null | |||
| @@ -1,119 +0,0 @@ | |||
| 1 | From 200c200eb19602ffd7c8f29d0b2df9df1fd311bf Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 3 | Date: Wed, 7 Apr 2021 17:44:20 +0800 | ||
| 4 | Subject: [PATCH] Fix debug info of work-item builtin translation (#745) | ||
| 5 | |||
| 6 | debug info of work-item builtins are lost in both llvm IR -> spirv and | ||
| 7 | spirv -> llvm IR translations. See #744 | ||
| 8 | |||
| 9 | Upstream-Status: Backport [https://github.com/KhronosGroup/SPIRV-LLVM-Translator/commit/c734c5c8bbd3012a09c610e4be68e90cc603c580] | ||
| 10 | Signed-off-by: Wenju He <wenju.he@intel.com> | ||
| 11 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 12 | --- | ||
| 13 | lib/SPIRV/OCL20ToSPIRV.cpp | 5 ++- | ||
| 14 | lib/SPIRV/SPIRVReader.cpp | 1 + | ||
| 15 | test/DebugInfo/builtin-get-global-id.ll | 60 +++++++++++++++++++++++++ | ||
| 16 | 3 files changed, 65 insertions(+), 1 deletion(-) | ||
| 17 | create mode 100644 test/DebugInfo/builtin-get-global-id.ll | ||
| 18 | |||
| 19 | diff --git a/lib/SPIRV/OCL20ToSPIRV.cpp b/lib/SPIRV/OCL20ToSPIRV.cpp | ||
| 20 | index 1262c48c..a742c8cf 100644 | ||
| 21 | --- a/lib/SPIRV/OCL20ToSPIRV.cpp | ||
| 22 | +++ b/lib/SPIRV/OCL20ToSPIRV.cpp | ||
| 23 | @@ -1297,11 +1297,14 @@ void OCL20ToSPIRV::transWorkItemBuiltinsToVariables() { | ||
| 24 | for (auto UI = I.user_begin(), UE = I.user_end(); UI != UE; ++UI) { | ||
| 25 | auto CI = dyn_cast<CallInst>(*UI); | ||
| 26 | assert(CI && "invalid instruction"); | ||
| 27 | - Value *NewValue = new LoadInst(BV, "", CI); | ||
| 28 | + const DebugLoc &DLoc = CI->getDebugLoc(); | ||
| 29 | + Instruction *NewValue = new LoadInst(BV, "", CI); | ||
| 30 | + NewValue->setDebugLoc(DLoc); | ||
| 31 | LLVM_DEBUG(dbgs() << "Transform: " << *CI << " => " << *NewValue << '\n'); | ||
| 32 | if (IsVec) { | ||
| 33 | NewValue = | ||
| 34 | ExtractElementInst::Create(NewValue, CI->getArgOperand(0), "", CI); | ||
| 35 | + NewValue->setDebugLoc(DLoc); | ||
| 36 | LLVM_DEBUG(dbgs() << *NewValue << '\n'); | ||
| 37 | } | ||
| 38 | NewValue->takeName(CI); | ||
| 39 | diff --git a/lib/SPIRV/SPIRVReader.cpp b/lib/SPIRV/SPIRVReader.cpp | ||
| 40 | index 16a3dd38..528f6663 100644 | ||
| 41 | --- a/lib/SPIRV/SPIRVReader.cpp | ||
| 42 | +++ b/lib/SPIRV/SPIRVReader.cpp | ||
| 43 | @@ -307,6 +307,7 @@ bool SPIRVToLLVM::transOCLBuiltinFromVariable(GlobalVariable *GV, | ||
| 44 | auto Replace = [&](std::vector<Value *> Arg, Instruction *I) { | ||
| 45 | auto Call = CallInst::Create(Func, Arg, "", I); | ||
| 46 | Call->takeName(I); | ||
| 47 | + Call->setDebugLoc(I->getDebugLoc()); | ||
| 48 | setAttrByCalledFunc(Call); | ||
| 49 | SPIRVDBG(dbgs() << "[transOCLBuiltinFromVariable] " << *I << " -> " << *Call | ||
| 50 | << '\n';) | ||
| 51 | diff --git a/test/DebugInfo/builtin-get-global-id.ll b/test/DebugInfo/builtin-get-global-id.ll | ||
| 52 | new file mode 100644 | ||
| 53 | index 00000000..a4a00e63 | ||
| 54 | --- /dev/null | ||
| 55 | +++ b/test/DebugInfo/builtin-get-global-id.ll | ||
| 56 | @@ -0,0 +1,60 @@ | ||
| 57 | +; Check debug info of builtin get_global_id is preserved from LLVM IR to spirv | ||
| 58 | +; and spirv to LLVM IR translation. | ||
| 59 | + | ||
| 60 | +; Original .cl source: | ||
| 61 | +; kernel void test() { | ||
| 62 | +; size_t gid = get_global_id(0); | ||
| 63 | +; } | ||
| 64 | + | ||
| 65 | +; Command line: | ||
| 66 | +; ./clang -cc1 1.cl -triple spir64 -cl-std=cl2.0 -emit-llvm -finclude-default-header -debug-info-kind=line-tables-only -O0 | ||
| 67 | + | ||
| 68 | +; RUN: llvm-as %s -o %t.bc | ||
| 69 | +; RUN: llvm-spirv %t.bc -spirv-text -o - | FileCheck %s --check-prefix CHECK-SPIRV | ||
| 70 | +; RUN: llvm-spirv %t.bc -o %t.spv | ||
| 71 | +; RUN: llvm-spirv -r %t.spv -o - | llvm-dis -o - | FileCheck %s | ||
| 72 | + | ||
| 73 | +target datalayout = "e-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024" | ||
| 74 | +target triple = "spir64" | ||
| 75 | + | ||
| 76 | +; CHECK-SPIRV: ExtInst {{.*}} DebugScope | ||
| 77 | +; CHECK-SPIRV-NEXT: Line {{[0-9]+}} 2 16 | ||
| 78 | +; CHECK-SPIRV-NEXT: Load {{[0-9]+}} [[LoadRes:[0-9]+]] | ||
| 79 | +; CHECK-SPIRV-NEXT: CompositeExtract {{[0-9]+}} {{[0-9]+}} [[LoadRes]] 0 | ||
| 80 | + | ||
| 81 | +; Function Attrs: convergent noinline norecurse nounwind optnone | ||
| 82 | +define spir_kernel void @test() #0 !dbg !7 !kernel_arg_addr_space !2 !kernel_arg_access_qual !2 !kernel_arg_type !2 !kernel_arg_base_type !2 !kernel_arg_type_qual !2 { | ||
| 83 | +entry: | ||
| 84 | + %gid = alloca i64, align 8 | ||
| 85 | + %call = call spir_func i64 @_Z13get_global_idj(i32 0) #2, !dbg !10 | ||
| 86 | +; CHECK: %call = call spir_func i64 @_Z13get_global_idj(i32 0) #1, !dbg [[DBG:![0-9]+]] | ||
| 87 | + store i64 %call, i64* %gid, align 8, !dbg !11 | ||
| 88 | + ret void, !dbg !12 | ||
| 89 | +} | ||
| 90 | + | ||
| 91 | +; Function Attrs: convergent nounwind readnone | ||
| 92 | +declare spir_func i64 @_Z13get_global_idj(i32) #1 | ||
| 93 | + | ||
| 94 | +attributes #0 = { convergent noinline norecurse nounwind optnone "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "frame-pointer"="none" "less-precise-fpmad"="false" "min-legal-vector-width"="0" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "uniform-work-group-size"="false" "unsafe-fp-math"="false" "use-soft-float"="false" } | ||
| 95 | +attributes #1 = { convergent nounwind readnone "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "frame-pointer"="none" "less-precise-fpmad"="false" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" } | ||
| 96 | +attributes #2 = { convergent nounwind readnone } | ||
| 97 | + | ||
| 98 | +!llvm.dbg.cu = !{!0} | ||
| 99 | +!llvm.module.flags = !{!3, !4} | ||
| 100 | +!opencl.ocl.version = !{!5} | ||
| 101 | +!opencl.spir.version = !{!5} | ||
| 102 | +!llvm.ident = !{!6} | ||
| 103 | + | ||
| 104 | +!0 = distinct !DICompileUnit(language: DW_LANG_C99, file: !1, producer: "clang version 12.0.0 (https://github.com/llvm/llvm-project.git b5bc56da8aa23dc57db9d286b0591dbcf9b1bdd3)", isOptimized: false, runtimeVersion: 0, emissionKind: LineTablesOnly, enums: !2, nameTableKind: None) | ||
| 105 | +!1 = !DIFile(filename: "<stdin>", directory: "") | ||
| 106 | +!2 = !{} | ||
| 107 | +!3 = !{i32 2, !"Debug Info Version", i32 3} | ||
| 108 | +!4 = !{i32 1, !"wchar_size", i32 4} | ||
| 109 | +!5 = !{i32 2, i32 0} | ||
| 110 | +!6 = !{!"clang version 12.0.0 (https://github.com/llvm/llvm-project.git b5bc56da8aa23dc57db9d286b0591dbcf9b1bdd3)"} | ||
| 111 | +!7 = distinct !DISubprogram(name: "test", scope: !8, file: !8, line: 1, type: !9, scopeLine: 1, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !2) | ||
| 112 | +!8 = !DIFile(filename: "1.cl", directory: "") | ||
| 113 | +!9 = !DISubroutineType(types: !2) | ||
| 114 | +!10 = !DILocation(line: 2, column: 16, scope: !7) | ||
| 115 | +!11 = !DILocation(line: 2, column: 10, scope: !7) | ||
| 116 | +!12 = !DILocation(line: 3, column: 1, scope: !7) | ||
| 117 | -- | ||
| 118 | 2.17.1 | ||
| 119 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/0001-Memory-leak-fix-for-Managed-Static-Mutex.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/0001-Memory-leak-fix-for-Managed-Static-Mutex.patch deleted file mode 100644 index 103dad5e..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/0001-Memory-leak-fix-for-Managed-Static-Mutex.patch +++ /dev/null | |||
| @@ -1,35 +0,0 @@ | |||
| 1 | From c86c43b70e029b102543e8a85d269cbeb5c00279 Mon Sep 17 00:00:00 2001 | ||
| 2 | From: juanrod2 <> | ||
| 3 | Date: Tue, 22 Dec 2020 08:33:08 +0800 | ||
| 4 | Subject: [PATCH] Memory leak fix for Managed Static Mutex | ||
| 5 | |||
| 6 | Upstream-Status: Backport [Taken from opencl-clang patches; https://github.com/intel/opencl-clang/blob/ocl-open-100/patches/llvm/0001-Memory-leak-fix-for-Managed-Static-Mutex.patch] | ||
| 7 | |||
| 8 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 9 | |||
| 10 | Cleaning a mutex inside ManagedStatic llvm class. | ||
| 11 | --- | ||
| 12 | llvm/lib/Support/ManagedStatic.cpp | 6 +++++- | ||
| 13 | 1 file changed, 5 insertions(+), 1 deletion(-) | ||
| 14 | |||
| 15 | diff --git a/llvm/lib/Support/ManagedStatic.cpp b/llvm/lib/Support/ManagedStatic.cpp | ||
| 16 | index 053493f72fb5..6571580ccecf 100644 | ||
| 17 | --- a/llvm/lib/Support/ManagedStatic.cpp | ||
| 18 | +++ b/llvm/lib/Support/ManagedStatic.cpp | ||
| 19 | @@ -76,8 +76,12 @@ void ManagedStaticBase::destroy() const { | ||
| 20 | |||
| 21 | /// llvm_shutdown - Deallocate and destroy all ManagedStatic variables. | ||
| 22 | void llvm::llvm_shutdown() { | ||
| 23 | - std::lock_guard<std::recursive_mutex> Lock(*getManagedStaticMutex()); | ||
| 24 | + getManagedStaticMutex()->lock(); | ||
| 25 | |||
| 26 | while (StaticList) | ||
| 27 | StaticList->destroy(); | ||
| 28 | + | ||
| 29 | + getManagedStaticMutex()->unlock(); | ||
| 30 | + delete ManagedStaticMutex; | ||
| 31 | + ManagedStaticMutex = nullptr; | ||
| 32 | } | ||
| 33 | -- | ||
| 34 | 2.29.2 | ||
| 35 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/0002-Add-cl_khr_extended_subgroup-extensions.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/0002-Add-cl_khr_extended_subgroup-extensions.patch deleted file mode 100644 index cbe492c4..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/0002-Add-cl_khr_extended_subgroup-extensions.patch +++ /dev/null | |||
| @@ -1,812 +0,0 @@ | |||
| 1 | From 27d47f1a17c8921b07acc8cdc26e38cc609de4a9 Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 3 | Date: Wed, 7 Apr 2021 16:38:38 +0800 | ||
| 4 | Subject: [PATCH 2/2] Add cl_khr_extended_subgroup extensions. | ||
| 5 | |||
| 6 | Added extensions and their function declarations into | ||
| 7 | the standard header. | ||
| 8 | |||
| 9 | Patch by Piotr Fusik! | ||
| 10 | |||
| 11 | Tags: #clang | ||
| 12 | |||
| 13 | Upstream-Status: Backport [https://github.com/llvm/llvm-project/commit/4a4402f0d72167477a6252e4c3daf5089ebc8f9a] | ||
| 14 | Signed-off-by: Anastasia Stulova <anastasia.stulova@arm.com> | ||
| 15 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 16 | --- | ||
| 17 | .../include/clang/Basic/OpenCLExtensions.def | 7 + | ||
| 18 | clang/lib/Headers/opencl-c.h | 668 ++++++++++++++++++ | ||
| 19 | clang/test/SemaOpenCL/extension-version.cl | 83 +++ | ||
| 20 | 3 files changed, 758 insertions(+) | ||
| 21 | |||
| 22 | diff --git a/clang/include/clang/Basic/OpenCLExtensions.def b/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 23 | index 608f78a13eef..d1574164f9b2 100644 | ||
| 24 | --- a/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 25 | +++ b/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 26 | @@ -74,6 +74,13 @@ OPENCLEXT_INTERNAL(cl_khr_mipmap_image_writes, 200, ~0U) | ||
| 27 | OPENCLEXT_INTERNAL(cl_khr_srgb_image_writes, 200, ~0U) | ||
| 28 | OPENCLEXT_INTERNAL(cl_khr_subgroups, 200, ~0U) | ||
| 29 | OPENCLEXT_INTERNAL(cl_khr_terminate_context, 200, ~0U) | ||
| 30 | +OPENCLEXT_INTERNAL(cl_khr_subgroup_extended_types, 200, ~0U) | ||
| 31 | +OPENCLEXT_INTERNAL(cl_khr_subgroup_non_uniform_vote, 200, ~0U) | ||
| 32 | +OPENCLEXT_INTERNAL(cl_khr_subgroup_ballot, 200, ~0U) | ||
| 33 | +OPENCLEXT_INTERNAL(cl_khr_subgroup_non_uniform_arithmetic, 200, ~0U) | ||
| 34 | +OPENCLEXT_INTERNAL(cl_khr_subgroup_shuffle, 200, ~0U) | ||
| 35 | +OPENCLEXT_INTERNAL(cl_khr_subgroup_shuffle_relative, 200, ~0U) | ||
| 36 | +OPENCLEXT_INTERNAL(cl_khr_subgroup_clustered_reduce, 200, ~0U) | ||
| 37 | |||
| 38 | // Clang Extensions. | ||
| 39 | OPENCLEXT_INTERNAL(cl_clang_storage_class_specifiers, 100, ~0U) | ||
| 40 | diff --git a/clang/lib/Headers/opencl-c.h b/clang/lib/Headers/opencl-c.h | ||
| 41 | index 93a946cec5b1..67d900eb1c3d 100644 | ||
| 42 | --- a/clang/lib/Headers/opencl-c.h | ||
| 43 | +++ b/clang/lib/Headers/opencl-c.h | ||
| 44 | @@ -17530,6 +17530,674 @@ double __ovld __conv sub_group_scan_inclusive_max(double x); | ||
| 45 | |||
| 46 | #endif //cl_khr_subgroups cl_intel_subgroups | ||
| 47 | |||
| 48 | +#if defined(cl_khr_subgroup_extended_types) | ||
| 49 | +char __ovld __conv sub_group_broadcast( char value, uint index ); | ||
| 50 | +char2 __ovld __conv sub_group_broadcast( char2 value, uint index ); | ||
| 51 | +char3 __ovld __conv sub_group_broadcast( char3 value, uint index ); | ||
| 52 | +char4 __ovld __conv sub_group_broadcast( char4 value, uint index ); | ||
| 53 | +char8 __ovld __conv sub_group_broadcast( char8 value, uint index ); | ||
| 54 | +char16 __ovld __conv sub_group_broadcast( char16 value, uint index ); | ||
| 55 | + | ||
| 56 | +uchar __ovld __conv sub_group_broadcast( uchar value, uint index ); | ||
| 57 | +uchar2 __ovld __conv sub_group_broadcast( uchar2 value, uint index ); | ||
| 58 | +uchar3 __ovld __conv sub_group_broadcast( uchar3 value, uint index ); | ||
| 59 | +uchar4 __ovld __conv sub_group_broadcast( uchar4 value, uint index ); | ||
| 60 | +uchar8 __ovld __conv sub_group_broadcast( uchar8 value, uint index ); | ||
| 61 | +uchar16 __ovld __conv sub_group_broadcast( uchar16 value, uint index ); | ||
| 62 | + | ||
| 63 | +short __ovld __conv sub_group_broadcast( short value, uint index ); | ||
| 64 | +short2 __ovld __conv sub_group_broadcast( short2 value, uint index ); | ||
| 65 | +short3 __ovld __conv sub_group_broadcast( short3 value, uint index ); | ||
| 66 | +short4 __ovld __conv sub_group_broadcast( short4 value, uint index ); | ||
| 67 | +short8 __ovld __conv sub_group_broadcast( short8 value, uint index ); | ||
| 68 | +short16 __ovld __conv sub_group_broadcast( short16 value, uint index ); | ||
| 69 | + | ||
| 70 | +ushort __ovld __conv sub_group_broadcast( ushort value, uint index ); | ||
| 71 | +ushort2 __ovld __conv sub_group_broadcast( ushort2 value, uint index ); | ||
| 72 | +ushort3 __ovld __conv sub_group_broadcast( ushort3 value, uint index ); | ||
| 73 | +ushort4 __ovld __conv sub_group_broadcast( ushort4 value, uint index ); | ||
| 74 | +ushort8 __ovld __conv sub_group_broadcast( ushort8 value, uint index ); | ||
| 75 | +ushort16 __ovld __conv sub_group_broadcast( ushort16 value, uint index ); | ||
| 76 | + | ||
| 77 | +// scalar int broadcast is part of cl_khr_subgroups | ||
| 78 | +int2 __ovld __conv sub_group_broadcast( int2 value, uint index ); | ||
| 79 | +int3 __ovld __conv sub_group_broadcast( int3 value, uint index ); | ||
| 80 | +int4 __ovld __conv sub_group_broadcast( int4 value, uint index ); | ||
| 81 | +int8 __ovld __conv sub_group_broadcast( int8 value, uint index ); | ||
| 82 | +int16 __ovld __conv sub_group_broadcast( int16 value, uint index ); | ||
| 83 | + | ||
| 84 | +// scalar uint broadcast is part of cl_khr_subgroups | ||
| 85 | +uint2 __ovld __conv sub_group_broadcast( uint2 value, uint index ); | ||
| 86 | +uint3 __ovld __conv sub_group_broadcast( uint3 value, uint index ); | ||
| 87 | +uint4 __ovld __conv sub_group_broadcast( uint4 value, uint index ); | ||
| 88 | +uint8 __ovld __conv sub_group_broadcast( uint8 value, uint index ); | ||
| 89 | +uint16 __ovld __conv sub_group_broadcast( uint16 value, uint index ); | ||
| 90 | + | ||
| 91 | +// scalar long broadcast is part of cl_khr_subgroups | ||
| 92 | +long2 __ovld __conv sub_group_broadcast( long2 value, uint index ); | ||
| 93 | +long3 __ovld __conv sub_group_broadcast( long3 value, uint index ); | ||
| 94 | +long4 __ovld __conv sub_group_broadcast( long4 value, uint index ); | ||
| 95 | +long8 __ovld __conv sub_group_broadcast( long8 value, uint index ); | ||
| 96 | +long16 __ovld __conv sub_group_broadcast( long16 value, uint index ); | ||
| 97 | + | ||
| 98 | +// scalar ulong broadcast is part of cl_khr_subgroups | ||
| 99 | +ulong2 __ovld __conv sub_group_broadcast( ulong2 value, uint index ); | ||
| 100 | +ulong3 __ovld __conv sub_group_broadcast( ulong3 value, uint index ); | ||
| 101 | +ulong4 __ovld __conv sub_group_broadcast( ulong4 value, uint index ); | ||
| 102 | +ulong8 __ovld __conv sub_group_broadcast( ulong8 value, uint index ); | ||
| 103 | +ulong16 __ovld __conv sub_group_broadcast( ulong16 value, uint index ); | ||
| 104 | + | ||
| 105 | +// scalar float broadcast is part of cl_khr_subgroups | ||
| 106 | +float2 __ovld __conv sub_group_broadcast( float2 value, uint index ); | ||
| 107 | +float3 __ovld __conv sub_group_broadcast( float3 value, uint index ); | ||
| 108 | +float4 __ovld __conv sub_group_broadcast( float4 value, uint index ); | ||
| 109 | +float8 __ovld __conv sub_group_broadcast( float8 value, uint index ); | ||
| 110 | +float16 __ovld __conv sub_group_broadcast( float16 value, uint index ); | ||
| 111 | + | ||
| 112 | +char __ovld __conv sub_group_reduce_add( char value ); | ||
| 113 | +uchar __ovld __conv sub_group_reduce_add( uchar value ); | ||
| 114 | +short __ovld __conv sub_group_reduce_add( short value ); | ||
| 115 | +ushort __ovld __conv sub_group_reduce_add( ushort value ); | ||
| 116 | + | ||
| 117 | +char __ovld __conv sub_group_reduce_min( char value ); | ||
| 118 | +uchar __ovld __conv sub_group_reduce_min( uchar value ); | ||
| 119 | +short __ovld __conv sub_group_reduce_min( short value ); | ||
| 120 | +ushort __ovld __conv sub_group_reduce_min( ushort value ); | ||
| 121 | + | ||
| 122 | +char __ovld __conv sub_group_reduce_max( char value ); | ||
| 123 | +uchar __ovld __conv sub_group_reduce_max( uchar value ); | ||
| 124 | +short __ovld __conv sub_group_reduce_max( short value ); | ||
| 125 | +ushort __ovld __conv sub_group_reduce_max( ushort value ); | ||
| 126 | + | ||
| 127 | +char __ovld __conv sub_group_scan_inclusive_add( char value ); | ||
| 128 | +uchar __ovld __conv sub_group_scan_inclusive_add( uchar value ); | ||
| 129 | +short __ovld __conv sub_group_scan_inclusive_add( short value ); | ||
| 130 | +ushort __ovld __conv sub_group_scan_inclusive_add( ushort value ); | ||
| 131 | + | ||
| 132 | +char __ovld __conv sub_group_scan_inclusive_min( char value ); | ||
| 133 | +uchar __ovld __conv sub_group_scan_inclusive_min( uchar value ); | ||
| 134 | +short __ovld __conv sub_group_scan_inclusive_min( short value ); | ||
| 135 | +ushort __ovld __conv sub_group_scan_inclusive_min( ushort value ); | ||
| 136 | + | ||
| 137 | +char __ovld __conv sub_group_scan_inclusive_max( char value ); | ||
| 138 | +uchar __ovld __conv sub_group_scan_inclusive_max( uchar value ); | ||
| 139 | +short __ovld __conv sub_group_scan_inclusive_max( short value ); | ||
| 140 | +ushort __ovld __conv sub_group_scan_inclusive_max( ushort value ); | ||
| 141 | + | ||
| 142 | +char __ovld __conv sub_group_scan_exclusive_add( char value ); | ||
| 143 | +uchar __ovld __conv sub_group_scan_exclusive_add( uchar value ); | ||
| 144 | +short __ovld __conv sub_group_scan_exclusive_add( short value ); | ||
| 145 | +ushort __ovld __conv sub_group_scan_exclusive_add( ushort value ); | ||
| 146 | + | ||
| 147 | +char __ovld __conv sub_group_scan_exclusive_min( char value ); | ||
| 148 | +uchar __ovld __conv sub_group_scan_exclusive_min( uchar value ); | ||
| 149 | +short __ovld __conv sub_group_scan_exclusive_min( short value ); | ||
| 150 | +ushort __ovld __conv sub_group_scan_exclusive_min( ushort value ); | ||
| 151 | + | ||
| 152 | +char __ovld __conv sub_group_scan_exclusive_max( char value ); | ||
| 153 | +uchar __ovld __conv sub_group_scan_exclusive_max( uchar value ); | ||
| 154 | +short __ovld __conv sub_group_scan_exclusive_max( short value ); | ||
| 155 | +ushort __ovld __conv sub_group_scan_exclusive_max( ushort value ); | ||
| 156 | + | ||
| 157 | +#if defined(cl_khr_fp16) | ||
| 158 | +// scalar half broadcast is part of cl_khr_subgroups | ||
| 159 | +half2 __ovld __conv sub_group_broadcast( half2 value, uint index ); | ||
| 160 | +half3 __ovld __conv sub_group_broadcast( half3 value, uint index ); | ||
| 161 | +half4 __ovld __conv sub_group_broadcast( half4 value, uint index ); | ||
| 162 | +half8 __ovld __conv sub_group_broadcast( half8 value, uint index ); | ||
| 163 | +half16 __ovld __conv sub_group_broadcast( half16 value, uint index ); | ||
| 164 | +#endif // cl_khr_fp16 | ||
| 165 | + | ||
| 166 | +#if defined(cl_khr_fp64) | ||
| 167 | +// scalar double broadcast is part of cl_khr_subgroups | ||
| 168 | +double2 __ovld __conv sub_group_broadcast( double2 value, uint index ); | ||
| 169 | +double3 __ovld __conv sub_group_broadcast( double3 value, uint index ); | ||
| 170 | +double4 __ovld __conv sub_group_broadcast( double4 value, uint index ); | ||
| 171 | +double8 __ovld __conv sub_group_broadcast( double8 value, uint index ); | ||
| 172 | +double16 __ovld __conv sub_group_broadcast( double16 value, uint index ); | ||
| 173 | +#endif // cl_khr_fp64 | ||
| 174 | + | ||
| 175 | +#endif // cl_khr_subgroup_extended_types | ||
| 176 | + | ||
| 177 | +#if defined(cl_khr_subgroup_non_uniform_vote) | ||
| 178 | +int __ovld sub_group_elect(void); | ||
| 179 | +int __ovld sub_group_non_uniform_all( int predicate ); | ||
| 180 | +int __ovld sub_group_non_uniform_any( int predicate ); | ||
| 181 | + | ||
| 182 | +int __ovld sub_group_non_uniform_all_equal( char value ); | ||
| 183 | +int __ovld sub_group_non_uniform_all_equal( uchar value ); | ||
| 184 | +int __ovld sub_group_non_uniform_all_equal( short value ); | ||
| 185 | +int __ovld sub_group_non_uniform_all_equal( ushort value ); | ||
| 186 | +int __ovld sub_group_non_uniform_all_equal( int value ); | ||
| 187 | +int __ovld sub_group_non_uniform_all_equal( uint value ); | ||
| 188 | +int __ovld sub_group_non_uniform_all_equal( long value ); | ||
| 189 | +int __ovld sub_group_non_uniform_all_equal( ulong value ); | ||
| 190 | +int __ovld sub_group_non_uniform_all_equal( float value ); | ||
| 191 | + | ||
| 192 | +#if defined(cl_khr_fp16) | ||
| 193 | +int __ovld sub_group_non_uniform_all_equal( half value ); | ||
| 194 | +#endif // cl_khr_fp16 | ||
| 195 | + | ||
| 196 | +#if defined(cl_khr_fp64) | ||
| 197 | +int __ovld sub_group_non_uniform_all_equal( double value ); | ||
| 198 | +#endif // cl_khr_fp64 | ||
| 199 | + | ||
| 200 | +#endif // cl_khr_subgroup_non_uniform_vote | ||
| 201 | + | ||
| 202 | +#if defined(cl_khr_subgroup_ballot) | ||
| 203 | +char __ovld sub_group_non_uniform_broadcast( char value, uint index ); | ||
| 204 | +char2 __ovld sub_group_non_uniform_broadcast( char2 value, uint index ); | ||
| 205 | +char3 __ovld sub_group_non_uniform_broadcast( char3 value, uint index ); | ||
| 206 | +char4 __ovld sub_group_non_uniform_broadcast( char4 value, uint index ); | ||
| 207 | +char8 __ovld sub_group_non_uniform_broadcast( char8 value, uint index ); | ||
| 208 | +char16 __ovld sub_group_non_uniform_broadcast( char16 value, uint index ); | ||
| 209 | + | ||
| 210 | +uchar __ovld sub_group_non_uniform_broadcast( uchar value, uint index ); | ||
| 211 | +uchar2 __ovld sub_group_non_uniform_broadcast( uchar2 value, uint index ); | ||
| 212 | +uchar3 __ovld sub_group_non_uniform_broadcast( uchar3 value, uint index ); | ||
| 213 | +uchar4 __ovld sub_group_non_uniform_broadcast( uchar4 value, uint index ); | ||
| 214 | +uchar8 __ovld sub_group_non_uniform_broadcast( uchar8 value, uint index ); | ||
| 215 | +uchar16 __ovld sub_group_non_uniform_broadcast( uchar16 value, uint index ); | ||
| 216 | + | ||
| 217 | +short __ovld sub_group_non_uniform_broadcast( short value, uint index ); | ||
| 218 | +short2 __ovld sub_group_non_uniform_broadcast( short2 value, uint index ); | ||
| 219 | +short3 __ovld sub_group_non_uniform_broadcast( short3 value, uint index ); | ||
| 220 | +short4 __ovld sub_group_non_uniform_broadcast( short4 value, uint index ); | ||
| 221 | +short8 __ovld sub_group_non_uniform_broadcast( short8 value, uint index ); | ||
| 222 | +short16 __ovld sub_group_non_uniform_broadcast( short16 value, uint index ); | ||
| 223 | + | ||
| 224 | +ushort __ovld sub_group_non_uniform_broadcast( ushort value, uint index ); | ||
| 225 | +ushort2 __ovld sub_group_non_uniform_broadcast( ushort2 value, uint index ); | ||
| 226 | +ushort3 __ovld sub_group_non_uniform_broadcast( ushort3 value, uint index ); | ||
| 227 | +ushort4 __ovld sub_group_non_uniform_broadcast( ushort4 value, uint index ); | ||
| 228 | +ushort8 __ovld sub_group_non_uniform_broadcast( ushort8 value, uint index ); | ||
| 229 | +ushort16 __ovld sub_group_non_uniform_broadcast( ushort16 value, uint index ); | ||
| 230 | + | ||
| 231 | +int __ovld sub_group_non_uniform_broadcast( int value, uint index ); | ||
| 232 | +int2 __ovld sub_group_non_uniform_broadcast( int2 value, uint index ); | ||
| 233 | +int3 __ovld sub_group_non_uniform_broadcast( int3 value, uint index ); | ||
| 234 | +int4 __ovld sub_group_non_uniform_broadcast( int4 value, uint index ); | ||
| 235 | +int8 __ovld sub_group_non_uniform_broadcast( int8 value, uint index ); | ||
| 236 | +int16 __ovld sub_group_non_uniform_broadcast( int16 value, uint index ); | ||
| 237 | + | ||
| 238 | +uint __ovld sub_group_non_uniform_broadcast( uint value, uint index ); | ||
| 239 | +uint2 __ovld sub_group_non_uniform_broadcast( uint2 value, uint index ); | ||
| 240 | +uint3 __ovld sub_group_non_uniform_broadcast( uint3 value, uint index ); | ||
| 241 | +uint4 __ovld sub_group_non_uniform_broadcast( uint4 value, uint index ); | ||
| 242 | +uint8 __ovld sub_group_non_uniform_broadcast( uint8 value, uint index ); | ||
| 243 | +uint16 __ovld sub_group_non_uniform_broadcast( uint16 value, uint index ); | ||
| 244 | + | ||
| 245 | +long __ovld sub_group_non_uniform_broadcast( long value, uint index ); | ||
| 246 | +long2 __ovld sub_group_non_uniform_broadcast( long2 value, uint index ); | ||
| 247 | +long3 __ovld sub_group_non_uniform_broadcast( long3 value, uint index ); | ||
| 248 | +long4 __ovld sub_group_non_uniform_broadcast( long4 value, uint index ); | ||
| 249 | +long8 __ovld sub_group_non_uniform_broadcast( long8 value, uint index ); | ||
| 250 | +long16 __ovld sub_group_non_uniform_broadcast( long16 value, uint index ); | ||
| 251 | + | ||
| 252 | +ulong __ovld sub_group_non_uniform_broadcast( ulong value, uint index ); | ||
| 253 | +ulong2 __ovld sub_group_non_uniform_broadcast( ulong2 value, uint index ); | ||
| 254 | +ulong3 __ovld sub_group_non_uniform_broadcast( ulong3 value, uint index ); | ||
| 255 | +ulong4 __ovld sub_group_non_uniform_broadcast( ulong4 value, uint index ); | ||
| 256 | +ulong8 __ovld sub_group_non_uniform_broadcast( ulong8 value, uint index ); | ||
| 257 | +ulong16 __ovld sub_group_non_uniform_broadcast( ulong16 value, uint index ); | ||
| 258 | + | ||
| 259 | +float __ovld sub_group_non_uniform_broadcast( float value, uint index ); | ||
| 260 | +float2 __ovld sub_group_non_uniform_broadcast( float2 value, uint index ); | ||
| 261 | +float3 __ovld sub_group_non_uniform_broadcast( float3 value, uint index ); | ||
| 262 | +float4 __ovld sub_group_non_uniform_broadcast( float4 value, uint index ); | ||
| 263 | +float8 __ovld sub_group_non_uniform_broadcast( float8 value, uint index ); | ||
| 264 | +float16 __ovld sub_group_non_uniform_broadcast( float16 value, uint index ); | ||
| 265 | + | ||
| 266 | +char __ovld sub_group_broadcast_first( char value ); | ||
| 267 | +uchar __ovld sub_group_broadcast_first( uchar value ); | ||
| 268 | +short __ovld sub_group_broadcast_first( short value ); | ||
| 269 | +ushort __ovld sub_group_broadcast_first( ushort value ); | ||
| 270 | +int __ovld sub_group_broadcast_first( int value ); | ||
| 271 | +uint __ovld sub_group_broadcast_first( uint value ); | ||
| 272 | +long __ovld sub_group_broadcast_first( long value ); | ||
| 273 | +ulong __ovld sub_group_broadcast_first( ulong value ); | ||
| 274 | +float __ovld sub_group_broadcast_first( float value ); | ||
| 275 | + | ||
| 276 | +uint4 __ovld sub_group_ballot( int predicate ); | ||
| 277 | +int __ovld __cnfn sub_group_inverse_ballot( uint4 value ); | ||
| 278 | +int __ovld __cnfn sub_group_ballot_bit_extract( uint4 value, uint index ); | ||
| 279 | +uint __ovld __cnfn sub_group_ballot_bit_count( uint4 value ); | ||
| 280 | + | ||
| 281 | +uint __ovld sub_group_ballot_inclusive_scan( uint4 value ); | ||
| 282 | +uint __ovld sub_group_ballot_exclusive_scan( uint4 value ); | ||
| 283 | +uint __ovld sub_group_ballot_find_lsb( uint4 value ); | ||
| 284 | +uint __ovld sub_group_ballot_find_msb( uint4 value ); | ||
| 285 | + | ||
| 286 | +uint4 __ovld __cnfn get_sub_group_eq_mask(void); | ||
| 287 | +uint4 __ovld __cnfn get_sub_group_ge_mask(void); | ||
| 288 | +uint4 __ovld __cnfn get_sub_group_gt_mask(void); | ||
| 289 | +uint4 __ovld __cnfn get_sub_group_le_mask(void); | ||
| 290 | +uint4 __ovld __cnfn get_sub_group_lt_mask(void); | ||
| 291 | + | ||
| 292 | +#if defined(cl_khr_fp16) | ||
| 293 | +half __ovld sub_group_non_uniform_broadcast( half value, uint index ); | ||
| 294 | +half2 __ovld sub_group_non_uniform_broadcast( half2 value, uint index ); | ||
| 295 | +half3 __ovld sub_group_non_uniform_broadcast( half3 value, uint index ); | ||
| 296 | +half4 __ovld sub_group_non_uniform_broadcast( half4 value, uint index ); | ||
| 297 | +half8 __ovld sub_group_non_uniform_broadcast( half8 value, uint index ); | ||
| 298 | +half16 __ovld sub_group_non_uniform_broadcast( half16 value, uint index ); | ||
| 299 | + | ||
| 300 | +half __ovld sub_group_broadcast_first( half value ); | ||
| 301 | +#endif // cl_khr_fp16 | ||
| 302 | + | ||
| 303 | +#if defined(cl_khr_fp64) | ||
| 304 | +double __ovld sub_group_non_uniform_broadcast( double value, uint index ); | ||
| 305 | +double2 __ovld sub_group_non_uniform_broadcast( double2 value, uint index ); | ||
| 306 | +double3 __ovld sub_group_non_uniform_broadcast( double3 value, uint index ); | ||
| 307 | +double4 __ovld sub_group_non_uniform_broadcast( double4 value, uint index ); | ||
| 308 | +double8 __ovld sub_group_non_uniform_broadcast( double8 value, uint index ); | ||
| 309 | +double16 __ovld sub_group_non_uniform_broadcast( double16 value, uint index ); | ||
| 310 | + | ||
| 311 | +double __ovld sub_group_broadcast_first( double value ); | ||
| 312 | +#endif // cl_khr_fp64 | ||
| 313 | + | ||
| 314 | +#endif // cl_khr_subgroup_ballot | ||
| 315 | + | ||
| 316 | +#if defined(cl_khr_subgroup_non_uniform_arithmetic) | ||
| 317 | +char __ovld sub_group_non_uniform_reduce_add( char value ); | ||
| 318 | +uchar __ovld sub_group_non_uniform_reduce_add( uchar value ); | ||
| 319 | +short __ovld sub_group_non_uniform_reduce_add( short value ); | ||
| 320 | +ushort __ovld sub_group_non_uniform_reduce_add( ushort value ); | ||
| 321 | +int __ovld sub_group_non_uniform_reduce_add( int value ); | ||
| 322 | +uint __ovld sub_group_non_uniform_reduce_add( uint value ); | ||
| 323 | +long __ovld sub_group_non_uniform_reduce_add( long value ); | ||
| 324 | +ulong __ovld sub_group_non_uniform_reduce_add( ulong value ); | ||
| 325 | +float __ovld sub_group_non_uniform_reduce_add( float value ); | ||
| 326 | + | ||
| 327 | +char __ovld sub_group_non_uniform_reduce_mul( char value ); | ||
| 328 | +uchar __ovld sub_group_non_uniform_reduce_mul( uchar value ); | ||
| 329 | +short __ovld sub_group_non_uniform_reduce_mul( short value ); | ||
| 330 | +ushort __ovld sub_group_non_uniform_reduce_mul( ushort value ); | ||
| 331 | +int __ovld sub_group_non_uniform_reduce_mul( int value ); | ||
| 332 | +uint __ovld sub_group_non_uniform_reduce_mul( uint value ); | ||
| 333 | +long __ovld sub_group_non_uniform_reduce_mul( long value ); | ||
| 334 | +ulong __ovld sub_group_non_uniform_reduce_mul( ulong value ); | ||
| 335 | +float __ovld sub_group_non_uniform_reduce_mul( float value ); | ||
| 336 | + | ||
| 337 | +char __ovld sub_group_non_uniform_reduce_min( char value ); | ||
| 338 | +uchar __ovld sub_group_non_uniform_reduce_min( uchar value ); | ||
| 339 | +short __ovld sub_group_non_uniform_reduce_min( short value ); | ||
| 340 | +ushort __ovld sub_group_non_uniform_reduce_min( ushort value ); | ||
| 341 | +int __ovld sub_group_non_uniform_reduce_min( int value ); | ||
| 342 | +uint __ovld sub_group_non_uniform_reduce_min( uint value ); | ||
| 343 | +long __ovld sub_group_non_uniform_reduce_min( long value ); | ||
| 344 | +ulong __ovld sub_group_non_uniform_reduce_min( ulong value ); | ||
| 345 | +float __ovld sub_group_non_uniform_reduce_min( float value ); | ||
| 346 | + | ||
| 347 | +char __ovld sub_group_non_uniform_reduce_max( char value ); | ||
| 348 | +uchar __ovld sub_group_non_uniform_reduce_max( uchar value ); | ||
| 349 | +short __ovld sub_group_non_uniform_reduce_max( short value ); | ||
| 350 | +ushort __ovld sub_group_non_uniform_reduce_max( ushort value ); | ||
| 351 | +int __ovld sub_group_non_uniform_reduce_max( int value ); | ||
| 352 | +uint __ovld sub_group_non_uniform_reduce_max( uint value ); | ||
| 353 | +long __ovld sub_group_non_uniform_reduce_max( long value ); | ||
| 354 | +ulong __ovld sub_group_non_uniform_reduce_max( ulong value ); | ||
| 355 | +float __ovld sub_group_non_uniform_reduce_max( float value ); | ||
| 356 | + | ||
| 357 | +char __ovld sub_group_non_uniform_scan_inclusive_add( char value ); | ||
| 358 | +uchar __ovld sub_group_non_uniform_scan_inclusive_add( uchar value ); | ||
| 359 | +short __ovld sub_group_non_uniform_scan_inclusive_add( short value ); | ||
| 360 | +ushort __ovld sub_group_non_uniform_scan_inclusive_add( ushort value ); | ||
| 361 | +int __ovld sub_group_non_uniform_scan_inclusive_add( int value ); | ||
| 362 | +uint __ovld sub_group_non_uniform_scan_inclusive_add( uint value ); | ||
| 363 | +long __ovld sub_group_non_uniform_scan_inclusive_add( long value ); | ||
| 364 | +ulong __ovld sub_group_non_uniform_scan_inclusive_add( ulong value ); | ||
| 365 | +float __ovld sub_group_non_uniform_scan_inclusive_add( float value ); | ||
| 366 | + | ||
| 367 | +char __ovld sub_group_non_uniform_scan_inclusive_mul( char value ); | ||
| 368 | +uchar __ovld sub_group_non_uniform_scan_inclusive_mul( uchar value ); | ||
| 369 | +short __ovld sub_group_non_uniform_scan_inclusive_mul( short value ); | ||
| 370 | +ushort __ovld sub_group_non_uniform_scan_inclusive_mul( ushort value ); | ||
| 371 | +int __ovld sub_group_non_uniform_scan_inclusive_mul( int value ); | ||
| 372 | +uint __ovld sub_group_non_uniform_scan_inclusive_mul( uint value ); | ||
| 373 | +long __ovld sub_group_non_uniform_scan_inclusive_mul( long value ); | ||
| 374 | +ulong __ovld sub_group_non_uniform_scan_inclusive_mul( ulong value ); | ||
| 375 | +float __ovld sub_group_non_uniform_scan_inclusive_mul( float value ); | ||
| 376 | + | ||
| 377 | +char __ovld sub_group_non_uniform_scan_inclusive_min( char value ); | ||
| 378 | +uchar __ovld sub_group_non_uniform_scan_inclusive_min( uchar value ); | ||
| 379 | +short __ovld sub_group_non_uniform_scan_inclusive_min( short value ); | ||
| 380 | +ushort __ovld sub_group_non_uniform_scan_inclusive_min( ushort value ); | ||
| 381 | +int __ovld sub_group_non_uniform_scan_inclusive_min( int value ); | ||
| 382 | +uint __ovld sub_group_non_uniform_scan_inclusive_min( uint value ); | ||
| 383 | +long __ovld sub_group_non_uniform_scan_inclusive_min( long value ); | ||
| 384 | +ulong __ovld sub_group_non_uniform_scan_inclusive_min( ulong value ); | ||
| 385 | +float __ovld sub_group_non_uniform_scan_inclusive_min( float value ); | ||
| 386 | + | ||
| 387 | +char __ovld sub_group_non_uniform_scan_inclusive_max( char value ); | ||
| 388 | +uchar __ovld sub_group_non_uniform_scan_inclusive_max( uchar value ); | ||
| 389 | +short __ovld sub_group_non_uniform_scan_inclusive_max( short value ); | ||
| 390 | +ushort __ovld sub_group_non_uniform_scan_inclusive_max( ushort value ); | ||
| 391 | +int __ovld sub_group_non_uniform_scan_inclusive_max( int value ); | ||
| 392 | +uint __ovld sub_group_non_uniform_scan_inclusive_max( uint value ); | ||
| 393 | +long __ovld sub_group_non_uniform_scan_inclusive_max( long value ); | ||
| 394 | +ulong __ovld sub_group_non_uniform_scan_inclusive_max( ulong value ); | ||
| 395 | +float __ovld sub_group_non_uniform_scan_inclusive_max( float value ); | ||
| 396 | + | ||
| 397 | +char __ovld sub_group_non_uniform_scan_exclusive_add( char value ); | ||
| 398 | +uchar __ovld sub_group_non_uniform_scan_exclusive_add( uchar value ); | ||
| 399 | +short __ovld sub_group_non_uniform_scan_exclusive_add( short value ); | ||
| 400 | +ushort __ovld sub_group_non_uniform_scan_exclusive_add( ushort value ); | ||
| 401 | +int __ovld sub_group_non_uniform_scan_exclusive_add( int value ); | ||
| 402 | +uint __ovld sub_group_non_uniform_scan_exclusive_add( uint value ); | ||
| 403 | +long __ovld sub_group_non_uniform_scan_exclusive_add( long value ); | ||
| 404 | +ulong __ovld sub_group_non_uniform_scan_exclusive_add( ulong value ); | ||
| 405 | +float __ovld sub_group_non_uniform_scan_exclusive_add( float value ); | ||
| 406 | + | ||
| 407 | +char __ovld sub_group_non_uniform_scan_exclusive_mul( char value ); | ||
| 408 | +uchar __ovld sub_group_non_uniform_scan_exclusive_mul( uchar value ); | ||
| 409 | +short __ovld sub_group_non_uniform_scan_exclusive_mul( short value ); | ||
| 410 | +ushort __ovld sub_group_non_uniform_scan_exclusive_mul( ushort value ); | ||
| 411 | +int __ovld sub_group_non_uniform_scan_exclusive_mul( int value ); | ||
| 412 | +uint __ovld sub_group_non_uniform_scan_exclusive_mul( uint value ); | ||
| 413 | +long __ovld sub_group_non_uniform_scan_exclusive_mul( long value ); | ||
| 414 | +ulong __ovld sub_group_non_uniform_scan_exclusive_mul( ulong value ); | ||
| 415 | +float __ovld sub_group_non_uniform_scan_exclusive_mul( float value ); | ||
| 416 | + | ||
| 417 | +char __ovld sub_group_non_uniform_scan_exclusive_min( char value ); | ||
| 418 | +uchar __ovld sub_group_non_uniform_scan_exclusive_min( uchar value ); | ||
| 419 | +short __ovld sub_group_non_uniform_scan_exclusive_min( short value ); | ||
| 420 | +ushort __ovld sub_group_non_uniform_scan_exclusive_min( ushort value ); | ||
| 421 | +int __ovld sub_group_non_uniform_scan_exclusive_min( int value ); | ||
| 422 | +uint __ovld sub_group_non_uniform_scan_exclusive_min( uint value ); | ||
| 423 | +long __ovld sub_group_non_uniform_scan_exclusive_min( long value ); | ||
| 424 | +ulong __ovld sub_group_non_uniform_scan_exclusive_min( ulong value ); | ||
| 425 | +float __ovld sub_group_non_uniform_scan_exclusive_min( float value ); | ||
| 426 | + | ||
| 427 | +char __ovld sub_group_non_uniform_scan_exclusive_max( char value ); | ||
| 428 | +uchar __ovld sub_group_non_uniform_scan_exclusive_max( uchar value ); | ||
| 429 | +short __ovld sub_group_non_uniform_scan_exclusive_max( short value ); | ||
| 430 | +ushort __ovld sub_group_non_uniform_scan_exclusive_max( ushort value ); | ||
| 431 | +int __ovld sub_group_non_uniform_scan_exclusive_max( int value ); | ||
| 432 | +uint __ovld sub_group_non_uniform_scan_exclusive_max( uint value ); | ||
| 433 | +long __ovld sub_group_non_uniform_scan_exclusive_max( long value ); | ||
| 434 | +ulong __ovld sub_group_non_uniform_scan_exclusive_max( ulong value ); | ||
| 435 | +float __ovld sub_group_non_uniform_scan_exclusive_max( float value ); | ||
| 436 | + | ||
| 437 | +char __ovld sub_group_non_uniform_reduce_and( char value ); | ||
| 438 | +uchar __ovld sub_group_non_uniform_reduce_and( uchar value ); | ||
| 439 | +short __ovld sub_group_non_uniform_reduce_and( short value ); | ||
| 440 | +ushort __ovld sub_group_non_uniform_reduce_and( ushort value ); | ||
| 441 | +int __ovld sub_group_non_uniform_reduce_and( int value ); | ||
| 442 | +uint __ovld sub_group_non_uniform_reduce_and( uint value ); | ||
| 443 | +long __ovld sub_group_non_uniform_reduce_and( long value ); | ||
| 444 | +ulong __ovld sub_group_non_uniform_reduce_and( ulong value ); | ||
| 445 | + | ||
| 446 | +char __ovld sub_group_non_uniform_reduce_or( char value ); | ||
| 447 | +uchar __ovld sub_group_non_uniform_reduce_or( uchar value ); | ||
| 448 | +short __ovld sub_group_non_uniform_reduce_or( short value ); | ||
| 449 | +ushort __ovld sub_group_non_uniform_reduce_or( ushort value ); | ||
| 450 | +int __ovld sub_group_non_uniform_reduce_or( int value ); | ||
| 451 | +uint __ovld sub_group_non_uniform_reduce_or( uint value ); | ||
| 452 | +long __ovld sub_group_non_uniform_reduce_or( long value ); | ||
| 453 | +ulong __ovld sub_group_non_uniform_reduce_or( ulong value ); | ||
| 454 | + | ||
| 455 | +char __ovld sub_group_non_uniform_reduce_xor( char value ); | ||
| 456 | +uchar __ovld sub_group_non_uniform_reduce_xor( uchar value ); | ||
| 457 | +short __ovld sub_group_non_uniform_reduce_xor( short value ); | ||
| 458 | +ushort __ovld sub_group_non_uniform_reduce_xor( ushort value ); | ||
| 459 | +int __ovld sub_group_non_uniform_reduce_xor( int value ); | ||
| 460 | +uint __ovld sub_group_non_uniform_reduce_xor( uint value ); | ||
| 461 | +long __ovld sub_group_non_uniform_reduce_xor( long value ); | ||
| 462 | +ulong __ovld sub_group_non_uniform_reduce_xor( ulong value ); | ||
| 463 | + | ||
| 464 | +char __ovld sub_group_non_uniform_scan_inclusive_and( char value ); | ||
| 465 | +uchar __ovld sub_group_non_uniform_scan_inclusive_and( uchar value ); | ||
| 466 | +short __ovld sub_group_non_uniform_scan_inclusive_and( short value ); | ||
| 467 | +ushort __ovld sub_group_non_uniform_scan_inclusive_and( ushort value ); | ||
| 468 | +int __ovld sub_group_non_uniform_scan_inclusive_and( int value ); | ||
| 469 | +uint __ovld sub_group_non_uniform_scan_inclusive_and( uint value ); | ||
| 470 | +long __ovld sub_group_non_uniform_scan_inclusive_and( long value ); | ||
| 471 | +ulong __ovld sub_group_non_uniform_scan_inclusive_and( ulong value ); | ||
| 472 | + | ||
| 473 | +char __ovld sub_group_non_uniform_scan_inclusive_or( char value ); | ||
| 474 | +uchar __ovld sub_group_non_uniform_scan_inclusive_or( uchar value ); | ||
| 475 | +short __ovld sub_group_non_uniform_scan_inclusive_or( short value ); | ||
| 476 | +ushort __ovld sub_group_non_uniform_scan_inclusive_or( ushort value ); | ||
| 477 | +int __ovld sub_group_non_uniform_scan_inclusive_or( int value ); | ||
| 478 | +uint __ovld sub_group_non_uniform_scan_inclusive_or( uint value ); | ||
| 479 | +long __ovld sub_group_non_uniform_scan_inclusive_or( long value ); | ||
| 480 | +ulong __ovld sub_group_non_uniform_scan_inclusive_or( ulong value ); | ||
| 481 | + | ||
| 482 | +char __ovld sub_group_non_uniform_scan_inclusive_xor( char value ); | ||
| 483 | +uchar __ovld sub_group_non_uniform_scan_inclusive_xor( uchar value ); | ||
| 484 | +short __ovld sub_group_non_uniform_scan_inclusive_xor( short value ); | ||
| 485 | +ushort __ovld sub_group_non_uniform_scan_inclusive_xor( ushort value ); | ||
| 486 | +int __ovld sub_group_non_uniform_scan_inclusive_xor( int value ); | ||
| 487 | +uint __ovld sub_group_non_uniform_scan_inclusive_xor( uint value ); | ||
| 488 | +long __ovld sub_group_non_uniform_scan_inclusive_xor( long value ); | ||
| 489 | +ulong __ovld sub_group_non_uniform_scan_inclusive_xor( ulong value ); | ||
| 490 | + | ||
| 491 | +char __ovld sub_group_non_uniform_scan_exclusive_and( char value ); | ||
| 492 | +uchar __ovld sub_group_non_uniform_scan_exclusive_and( uchar value ); | ||
| 493 | +short __ovld sub_group_non_uniform_scan_exclusive_and( short value ); | ||
| 494 | +ushort __ovld sub_group_non_uniform_scan_exclusive_and( ushort value ); | ||
| 495 | +int __ovld sub_group_non_uniform_scan_exclusive_and( int value ); | ||
| 496 | +uint __ovld sub_group_non_uniform_scan_exclusive_and( uint value ); | ||
| 497 | +long __ovld sub_group_non_uniform_scan_exclusive_and( long value ); | ||
| 498 | +ulong __ovld sub_group_non_uniform_scan_exclusive_and( ulong value ); | ||
| 499 | + | ||
| 500 | +char __ovld sub_group_non_uniform_scan_exclusive_or( char value ); | ||
| 501 | +uchar __ovld sub_group_non_uniform_scan_exclusive_or( uchar value ); | ||
| 502 | +short __ovld sub_group_non_uniform_scan_exclusive_or( short value ); | ||
| 503 | +ushort __ovld sub_group_non_uniform_scan_exclusive_or( ushort value ); | ||
| 504 | +int __ovld sub_group_non_uniform_scan_exclusive_or( int value ); | ||
| 505 | +uint __ovld sub_group_non_uniform_scan_exclusive_or( uint value ); | ||
| 506 | +long __ovld sub_group_non_uniform_scan_exclusive_or( long value ); | ||
| 507 | +ulong __ovld sub_group_non_uniform_scan_exclusive_or( ulong value ); | ||
| 508 | + | ||
| 509 | +char __ovld sub_group_non_uniform_scan_exclusive_xor( char value ); | ||
| 510 | +uchar __ovld sub_group_non_uniform_scan_exclusive_xor( uchar value ); | ||
| 511 | +short __ovld sub_group_non_uniform_scan_exclusive_xor( short value ); | ||
| 512 | +ushort __ovld sub_group_non_uniform_scan_exclusive_xor( ushort value ); | ||
| 513 | +int __ovld sub_group_non_uniform_scan_exclusive_xor( int value ); | ||
| 514 | +uint __ovld sub_group_non_uniform_scan_exclusive_xor( uint value ); | ||
| 515 | +long __ovld sub_group_non_uniform_scan_exclusive_xor( long value ); | ||
| 516 | +ulong __ovld sub_group_non_uniform_scan_exclusive_xor( ulong value ); | ||
| 517 | + | ||
| 518 | +int __ovld sub_group_non_uniform_reduce_logical_and( int predicate ); | ||
| 519 | +int __ovld sub_group_non_uniform_reduce_logical_or( int predicate ); | ||
| 520 | +int __ovld sub_group_non_uniform_reduce_logical_xor( int predicate ); | ||
| 521 | + | ||
| 522 | +int __ovld sub_group_non_uniform_scan_inclusive_logical_and( int predicate ); | ||
| 523 | +int __ovld sub_group_non_uniform_scan_inclusive_logical_or( int predicate ); | ||
| 524 | +int __ovld sub_group_non_uniform_scan_inclusive_logical_xor( int predicate ); | ||
| 525 | + | ||
| 526 | +int __ovld sub_group_non_uniform_scan_exclusive_logical_and( int predicate ); | ||
| 527 | +int __ovld sub_group_non_uniform_scan_exclusive_logical_or( int predicate ); | ||
| 528 | +int __ovld sub_group_non_uniform_scan_exclusive_logical_xor( int predicate ); | ||
| 529 | + | ||
| 530 | +#if defined(cl_khr_fp16) | ||
| 531 | +half __ovld sub_group_non_uniform_reduce_add( half value ); | ||
| 532 | +half __ovld sub_group_non_uniform_reduce_mul( half value ); | ||
| 533 | +half __ovld sub_group_non_uniform_reduce_min( half value ); | ||
| 534 | +half __ovld sub_group_non_uniform_reduce_max( half value ); | ||
| 535 | +half __ovld sub_group_non_uniform_scan_inclusive_add( half value ); | ||
| 536 | +half __ovld sub_group_non_uniform_scan_inclusive_mul( half value ); | ||
| 537 | +half __ovld sub_group_non_uniform_scan_inclusive_min( half value ); | ||
| 538 | +half __ovld sub_group_non_uniform_scan_inclusive_max( half value ); | ||
| 539 | +half __ovld sub_group_non_uniform_scan_exclusive_add( half value ); | ||
| 540 | +half __ovld sub_group_non_uniform_scan_exclusive_mul( half value ); | ||
| 541 | +half __ovld sub_group_non_uniform_scan_exclusive_min( half value ); | ||
| 542 | +half __ovld sub_group_non_uniform_scan_exclusive_max( half value ); | ||
| 543 | +#endif // cl_khr_fp16 | ||
| 544 | + | ||
| 545 | +#if defined(cl_khr_fp64) | ||
| 546 | +double __ovld sub_group_non_uniform_reduce_add( double value ); | ||
| 547 | +double __ovld sub_group_non_uniform_reduce_mul( double value ); | ||
| 548 | +double __ovld sub_group_non_uniform_reduce_min( double value ); | ||
| 549 | +double __ovld sub_group_non_uniform_reduce_max( double value ); | ||
| 550 | +double __ovld sub_group_non_uniform_scan_inclusive_add( double value ); | ||
| 551 | +double __ovld sub_group_non_uniform_scan_inclusive_mul( double value ); | ||
| 552 | +double __ovld sub_group_non_uniform_scan_inclusive_min( double value ); | ||
| 553 | +double __ovld sub_group_non_uniform_scan_inclusive_max( double value ); | ||
| 554 | +double __ovld sub_group_non_uniform_scan_exclusive_add( double value ); | ||
| 555 | +double __ovld sub_group_non_uniform_scan_exclusive_mul( double value ); | ||
| 556 | +double __ovld sub_group_non_uniform_scan_exclusive_min( double value ); | ||
| 557 | +double __ovld sub_group_non_uniform_scan_exclusive_max( double value ); | ||
| 558 | +#endif // cl_khr_fp64 | ||
| 559 | + | ||
| 560 | +#endif // cl_khr_subgroup_non_uniform_arithmetic | ||
| 561 | + | ||
| 562 | +#if defined(cl_khr_subgroup_shuffle) | ||
| 563 | +char __ovld sub_group_shuffle( char value, uint index ); | ||
| 564 | +uchar __ovld sub_group_shuffle( uchar value, uint index ); | ||
| 565 | +short __ovld sub_group_shuffle( short value, uint index ); | ||
| 566 | +ushort __ovld sub_group_shuffle( ushort value, uint index ); | ||
| 567 | +int __ovld sub_group_shuffle( int value, uint index ); | ||
| 568 | +uint __ovld sub_group_shuffle( uint value, uint index ); | ||
| 569 | +long __ovld sub_group_shuffle( long value, uint index ); | ||
| 570 | +ulong __ovld sub_group_shuffle( ulong value, uint index ); | ||
| 571 | +float __ovld sub_group_shuffle( float value, uint index ); | ||
| 572 | + | ||
| 573 | +char __ovld sub_group_shuffle_xor( char value, uint mask ); | ||
| 574 | +uchar __ovld sub_group_shuffle_xor( uchar value, uint mask ); | ||
| 575 | +short __ovld sub_group_shuffle_xor( short value, uint mask ); | ||
| 576 | +ushort __ovld sub_group_shuffle_xor( ushort value, uint mask ); | ||
| 577 | +int __ovld sub_group_shuffle_xor( int value, uint mask ); | ||
| 578 | +uint __ovld sub_group_shuffle_xor( uint value, uint mask ); | ||
| 579 | +long __ovld sub_group_shuffle_xor( long value, uint mask ); | ||
| 580 | +ulong __ovld sub_group_shuffle_xor( ulong value, uint mask ); | ||
| 581 | +float __ovld sub_group_shuffle_xor( float value, uint mask ); | ||
| 582 | + | ||
| 583 | +#if defined(cl_khr_fp16) | ||
| 584 | +half __ovld sub_group_shuffle( half value, uint index ); | ||
| 585 | +half __ovld sub_group_shuffle_xor( half value, uint mask ); | ||
| 586 | +#endif // cl_khr_fp16 | ||
| 587 | + | ||
| 588 | +#if defined(cl_khr_fp64) | ||
| 589 | +double __ovld sub_group_shuffle( double value, uint index ); | ||
| 590 | +double __ovld sub_group_shuffle_xor( double value, uint mask ); | ||
| 591 | +#endif // cl_khr_fp64 | ||
| 592 | + | ||
| 593 | +#endif // cl_khr_subgroup_shuffle | ||
| 594 | + | ||
| 595 | +#if defined(cl_khr_subgroup_shuffle_relative) | ||
| 596 | +char __ovld sub_group_shuffle_up( char value, uint delta ); | ||
| 597 | +uchar __ovld sub_group_shuffle_up( uchar value, uint delta ); | ||
| 598 | +short __ovld sub_group_shuffle_up( short value, uint delta ); | ||
| 599 | +ushort __ovld sub_group_shuffle_up( ushort value, uint delta ); | ||
| 600 | +int __ovld sub_group_shuffle_up( int value, uint delta ); | ||
| 601 | +uint __ovld sub_group_shuffle_up( uint value, uint delta ); | ||
| 602 | +long __ovld sub_group_shuffle_up( long value, uint delta ); | ||
| 603 | +ulong __ovld sub_group_shuffle_up( ulong value, uint delta ); | ||
| 604 | +float __ovld sub_group_shuffle_up( float value, uint delta ); | ||
| 605 | + | ||
| 606 | +char __ovld sub_group_shuffle_down( char value, uint delta ); | ||
| 607 | +uchar __ovld sub_group_shuffle_down( uchar value, uint delta ); | ||
| 608 | +short __ovld sub_group_shuffle_down( short value, uint delta ); | ||
| 609 | +ushort __ovld sub_group_shuffle_down( ushort value, uint delta ); | ||
| 610 | +int __ovld sub_group_shuffle_down( int value, uint delta ); | ||
| 611 | +uint __ovld sub_group_shuffle_down( uint value, uint delta ); | ||
| 612 | +long __ovld sub_group_shuffle_down( long value, uint delta ); | ||
| 613 | +ulong __ovld sub_group_shuffle_down( ulong value, uint delta ); | ||
| 614 | +float __ovld sub_group_shuffle_down( float value, uint delta ); | ||
| 615 | + | ||
| 616 | +#if defined(cl_khr_fp16) | ||
| 617 | +half __ovld sub_group_shuffle_up( half value, uint delta ); | ||
| 618 | +half __ovld sub_group_shuffle_down( half value, uint delta ); | ||
| 619 | +#endif // cl_khr_fp16 | ||
| 620 | + | ||
| 621 | +#if defined(cl_khr_fp64) | ||
| 622 | +double __ovld sub_group_shuffle_up( double value, uint delta ); | ||
| 623 | +double __ovld sub_group_shuffle_down( double value, uint delta ); | ||
| 624 | +#endif // cl_khr_fp64 | ||
| 625 | + | ||
| 626 | +#endif // cl_khr_subgroup_shuffle_relative | ||
| 627 | + | ||
| 628 | +#if defined(cl_khr_subgroup_clustered_reduce) | ||
| 629 | +char __ovld sub_group_clustered_reduce_add( char value, uint clustersize ); | ||
| 630 | +uchar __ovld sub_group_clustered_reduce_add( uchar value, uint clustersize ); | ||
| 631 | +short __ovld sub_group_clustered_reduce_add( short value, uint clustersize ); | ||
| 632 | +ushort __ovld sub_group_clustered_reduce_add( ushort value, uint clustersize ); | ||
| 633 | +int __ovld sub_group_clustered_reduce_add( int value, uint clustersize ); | ||
| 634 | +uint __ovld sub_group_clustered_reduce_add( uint value, uint clustersize ); | ||
| 635 | +long __ovld sub_group_clustered_reduce_add( long value, uint clustersize ); | ||
| 636 | +ulong __ovld sub_group_clustered_reduce_add( ulong value, uint clustersize ); | ||
| 637 | +float __ovld sub_group_clustered_reduce_add( float value, uint clustersize ); | ||
| 638 | + | ||
| 639 | +char __ovld sub_group_clustered_reduce_mul( char value, uint clustersize ); | ||
| 640 | +uchar __ovld sub_group_clustered_reduce_mul( uchar value, uint clustersize ); | ||
| 641 | +short __ovld sub_group_clustered_reduce_mul( short value, uint clustersize ); | ||
| 642 | +ushort __ovld sub_group_clustered_reduce_mul( ushort value, uint clustersize ); | ||
| 643 | +int __ovld sub_group_clustered_reduce_mul( int value, uint clustersize ); | ||
| 644 | +uint __ovld sub_group_clustered_reduce_mul( uint value, uint clustersize ); | ||
| 645 | +long __ovld sub_group_clustered_reduce_mul( long value, uint clustersize ); | ||
| 646 | +ulong __ovld sub_group_clustered_reduce_mul( ulong value, uint clustersize ); | ||
| 647 | +float __ovld sub_group_clustered_reduce_mul( float value, uint clustersize ); | ||
| 648 | + | ||
| 649 | +char __ovld sub_group_clustered_reduce_min( char value, uint clustersize ); | ||
| 650 | +uchar __ovld sub_group_clustered_reduce_min( uchar value, uint clustersize ); | ||
| 651 | +short __ovld sub_group_clustered_reduce_min( short value, uint clustersize ); | ||
| 652 | +ushort __ovld sub_group_clustered_reduce_min( ushort value, uint clustersize ); | ||
| 653 | +int __ovld sub_group_clustered_reduce_min( int value, uint clustersize ); | ||
| 654 | +uint __ovld sub_group_clustered_reduce_min( uint value, uint clustersize ); | ||
| 655 | +long __ovld sub_group_clustered_reduce_min( long value, uint clustersize ); | ||
| 656 | +ulong __ovld sub_group_clustered_reduce_min( ulong value, uint clustersize ); | ||
| 657 | +float __ovld sub_group_clustered_reduce_min( float value, uint clustersize ); | ||
| 658 | + | ||
| 659 | +char __ovld sub_group_clustered_reduce_max( char value, uint clustersize ); | ||
| 660 | +uchar __ovld sub_group_clustered_reduce_max( uchar value, uint clustersize ); | ||
| 661 | +short __ovld sub_group_clustered_reduce_max( short value, uint clustersize ); | ||
| 662 | +ushort __ovld sub_group_clustered_reduce_max( ushort value, uint clustersize ); | ||
| 663 | +int __ovld sub_group_clustered_reduce_max( int value, uint clustersize ); | ||
| 664 | +uint __ovld sub_group_clustered_reduce_max( uint value, uint clustersize ); | ||
| 665 | +long __ovld sub_group_clustered_reduce_max( long value, uint clustersize ); | ||
| 666 | +ulong __ovld sub_group_clustered_reduce_max( ulong value, uint clustersize ); | ||
| 667 | +float __ovld sub_group_clustered_reduce_max( float value, uint clustersize ); | ||
| 668 | + | ||
| 669 | +char __ovld sub_group_clustered_reduce_and( char value, uint clustersize ); | ||
| 670 | +uchar __ovld sub_group_clustered_reduce_and( uchar value, uint clustersize ); | ||
| 671 | +short __ovld sub_group_clustered_reduce_and( short value, uint clustersize ); | ||
| 672 | +ushort __ovld sub_group_clustered_reduce_and( ushort value, uint clustersize ); | ||
| 673 | +int __ovld sub_group_clustered_reduce_and( int value, uint clustersize ); | ||
| 674 | +uint __ovld sub_group_clustered_reduce_and( uint value, uint clustersize ); | ||
| 675 | +long __ovld sub_group_clustered_reduce_and( long value, uint clustersize ); | ||
| 676 | +ulong __ovld sub_group_clustered_reduce_and( ulong value, uint clustersize ); | ||
| 677 | + | ||
| 678 | +char __ovld sub_group_clustered_reduce_or( char value, uint clustersize ); | ||
| 679 | +uchar __ovld sub_group_clustered_reduce_or( uchar value, uint clustersize ); | ||
| 680 | +short __ovld sub_group_clustered_reduce_or( short value, uint clustersize ); | ||
| 681 | +ushort __ovld sub_group_clustered_reduce_or( ushort value, uint clustersize ); | ||
| 682 | +int __ovld sub_group_clustered_reduce_or( int value, uint clustersize ); | ||
| 683 | +uint __ovld sub_group_clustered_reduce_or( uint value, uint clustersize ); | ||
| 684 | +long __ovld sub_group_clustered_reduce_or( long value, uint clustersize ); | ||
| 685 | +ulong __ovld sub_group_clustered_reduce_or( ulong value, uint clustersize ); | ||
| 686 | + | ||
| 687 | +char __ovld sub_group_clustered_reduce_xor( char value, uint clustersize ); | ||
| 688 | +uchar __ovld sub_group_clustered_reduce_xor( uchar value, uint clustersize ); | ||
| 689 | +short __ovld sub_group_clustered_reduce_xor( short value, uint clustersize ); | ||
| 690 | +ushort __ovld sub_group_clustered_reduce_xor( ushort value, uint clustersize ); | ||
| 691 | +int __ovld sub_group_clustered_reduce_xor( int value, uint clustersize ); | ||
| 692 | +uint __ovld sub_group_clustered_reduce_xor( uint value, uint clustersize ); | ||
| 693 | +long __ovld sub_group_clustered_reduce_xor( long value, uint clustersize ); | ||
| 694 | +ulong __ovld sub_group_clustered_reduce_xor( ulong value, uint clustersize ); | ||
| 695 | + | ||
| 696 | +int __ovld sub_group_clustered_reduce_logical_and( int predicate, uint clustersize ); | ||
| 697 | +int __ovld sub_group_clustered_reduce_logical_or( int predicate, uint clustersize ); | ||
| 698 | +int __ovld sub_group_clustered_reduce_logical_xor( int predicate, uint clustersize ); | ||
| 699 | + | ||
| 700 | +#if defined(cl_khr_fp16) | ||
| 701 | +half __ovld sub_group_clustered_reduce_add( half value, uint clustersize ); | ||
| 702 | +half __ovld sub_group_clustered_reduce_mul( half value, uint clustersize ); | ||
| 703 | +half __ovld sub_group_clustered_reduce_min( half value, uint clustersize ); | ||
| 704 | +half __ovld sub_group_clustered_reduce_max( half value, uint clustersize ); | ||
| 705 | +#endif // cl_khr_fp16 | ||
| 706 | + | ||
| 707 | +#if defined(cl_khr_fp64) | ||
| 708 | +double __ovld sub_group_clustered_reduce_add( double value, uint clustersize ); | ||
| 709 | +double __ovld sub_group_clustered_reduce_mul( double value, uint clustersize ); | ||
| 710 | +double __ovld sub_group_clustered_reduce_min( double value, uint clustersize ); | ||
| 711 | +double __ovld sub_group_clustered_reduce_max( double value, uint clustersize ); | ||
| 712 | +#endif // cl_khr_fp64 | ||
| 713 | + | ||
| 714 | +#endif // cl_khr_subgroup_clustered_reduce | ||
| 715 | + | ||
| 716 | #if defined(cl_intel_subgroups) | ||
| 717 | // Intel-Specific Sub Group Functions | ||
| 718 | float __ovld __conv intel_sub_group_shuffle( float x, uint c ); | ||
| 719 | diff --git a/clang/test/SemaOpenCL/extension-version.cl b/clang/test/SemaOpenCL/extension-version.cl | ||
| 720 | index 0e6bbb7d3bcd..86c78143a0eb 100644 | ||
| 721 | --- a/clang/test/SemaOpenCL/extension-version.cl | ||
| 722 | +++ b/clang/test/SemaOpenCL/extension-version.cl | ||
| 723 | @@ -333,3 +333,86 @@ | ||
| 724 | #endif | ||
| 725 | #pragma OPENCL EXTENSION cl_intel_device_side_avc_motion_estimation : enable | ||
| 726 | |||
| 727 | +#if (defined(__OPENCL_CPP_VERSION__) || __OPENCL_C_VERSION__ >= 200) | ||
| 728 | +#ifndef cl_khr_subgroup_extended_types | ||
| 729 | +#error "Missing cl_khr_subgroup_extended_types" | ||
| 730 | +#endif | ||
| 731 | +#else | ||
| 732 | +#ifdef cl_khr_subgroup_extended_types | ||
| 733 | +#error "Incorrect cl_khr_subgroup_extended_types define" | ||
| 734 | +#endif | ||
| 735 | +// expected-warning@+2{{unsupported OpenCL extension 'cl_khr_subgroup_extended_types' - ignoring}} | ||
| 736 | +#endif | ||
| 737 | +#pragma OPENCL EXTENSION cl_khr_subgroup_extended_types : enable | ||
| 738 | + | ||
| 739 | +#if (defined(__OPENCL_CPP_VERSION__) || __OPENCL_C_VERSION__ >= 200) | ||
| 740 | +#ifndef cl_khr_subgroup_non_uniform_vote | ||
| 741 | +#error "Missing cl_khr_subgroup_non_uniform_vote" | ||
| 742 | +#endif | ||
| 743 | +#else | ||
| 744 | +#ifdef cl_khr_subgroup_non_uniform_vote | ||
| 745 | +#error "Incorrect cl_khr_subgroup_non_uniform_vote define" | ||
| 746 | +#endif | ||
| 747 | +// expected-warning@+2{{unsupported OpenCL extension 'cl_khr_subgroup_non_uniform_vote' - ignoring}} | ||
| 748 | +#endif | ||
| 749 | +#pragma OPENCL EXTENSION cl_khr_subgroup_non_uniform_vote : enable | ||
| 750 | + | ||
| 751 | +#if (defined(__OPENCL_CPP_VERSION__) || __OPENCL_C_VERSION__ >= 200) | ||
| 752 | +#ifndef cl_khr_subgroup_ballot | ||
| 753 | +#error "Missing cl_khr_subgroup_ballot" | ||
| 754 | +#endif | ||
| 755 | +#else | ||
| 756 | +#ifdef cl_khr_subgroup_ballot | ||
| 757 | +#error "Incorrect cl_khr_subgroup_ballot define" | ||
| 758 | +#endif | ||
| 759 | +// expected-warning@+2{{unsupported OpenCL extension 'cl_khr_subgroup_ballot' - ignoring}} | ||
| 760 | +#endif | ||
| 761 | +#pragma OPENCL EXTENSION cl_khr_subgroup_ballot : enable | ||
| 762 | + | ||
| 763 | +#if (defined(__OPENCL_CPP_VERSION__) || __OPENCL_C_VERSION__ >= 200) | ||
| 764 | +#ifndef cl_khr_subgroup_non_uniform_arithmetic | ||
| 765 | +#error "Missing cl_khr_subgroup_non_uniform_arithmetic" | ||
| 766 | +#endif | ||
| 767 | +#else | ||
| 768 | +#ifdef cl_khr_subgroup_non_uniform_arithmetic | ||
| 769 | +#error "Incorrect cl_khr_subgroup_non_uniform_arithmetic define" | ||
| 770 | +#endif | ||
| 771 | +// expected-warning@+2{{unsupported OpenCL extension 'cl_khr_subgroup_non_uniform_arithmetic' - ignoring}} | ||
| 772 | +#endif | ||
| 773 | +#pragma OPENCL EXTENSION cl_khr_subgroup_non_uniform_arithmetic : enable | ||
| 774 | + | ||
| 775 | +#if (defined(__OPENCL_CPP_VERSION__) || __OPENCL_C_VERSION__ >= 200) | ||
| 776 | +#ifndef cl_khr_subgroup_shuffle | ||
| 777 | +#error "Missing cl_khr_subgroup_shuffle" | ||
| 778 | +#endif | ||
| 779 | +#else | ||
| 780 | +#ifdef cl_khr_subgroup_shuffle | ||
| 781 | +#error "Incorrect cl_khr_subgroup_shuffle define" | ||
| 782 | +#endif | ||
| 783 | +// expected-warning@+2{{unsupported OpenCL extension 'cl_khr_subgroup_shuffle' - ignoring}} | ||
| 784 | +#endif | ||
| 785 | +#pragma OPENCL EXTENSION cl_khr_subgroup_shuffle : enable | ||
| 786 | + | ||
| 787 | +#if (defined(__OPENCL_CPP_VERSION__) || __OPENCL_C_VERSION__ >= 200) | ||
| 788 | +#ifndef cl_khr_subgroup_shuffle_relative | ||
| 789 | +#error "Missing cl_khr_subgroup_shuffle_relative" | ||
| 790 | +#endif | ||
| 791 | +#else | ||
| 792 | +#ifdef cl_khr_subgroup_shuffle_relative | ||
| 793 | +#error "Incorrect cl_khr_subgroup_shuffle_relative define" | ||
| 794 | +#endif | ||
| 795 | +// expected-warning@+2{{unsupported OpenCL extension 'cl_khr_subgroup_shuffle_relative' - ignoring}} | ||
| 796 | +#endif | ||
| 797 | +#pragma OPENCL EXTENSION cl_khr_subgroup_shuffle_relative : enable | ||
| 798 | + | ||
| 799 | +#if (defined(__OPENCL_CPP_VERSION__) || __OPENCL_C_VERSION__ >= 200) | ||
| 800 | +#ifndef cl_khr_subgroup_clustered_reduce | ||
| 801 | +#error "Missing cl_khr_subgroup_clustered_reduce" | ||
| 802 | +#endif | ||
| 803 | +#else | ||
| 804 | +#ifdef cl_khr_subgroup_clustered_reduce | ||
| 805 | +#error "Incorrect cl_khr_subgroup_clustered_reduce define" | ||
| 806 | +#endif | ||
| 807 | +// expected-warning@+2{{unsupported OpenCL extension 'cl_khr_subgroup_clustered_reduce' - ignoring}} | ||
| 808 | +#endif | ||
| 809 | +#pragma OPENCL EXTENSION cl_khr_subgroup_clustered_reduce : enable | ||
| 810 | -- | ||
| 811 | 2.17.1 | ||
| 812 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/BasicBlockUtils-Add-metadata-fixing-in-SplitBlockPre.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/BasicBlockUtils-Add-metadata-fixing-in-SplitBlockPre.patch deleted file mode 100644 index cd519971..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/BasicBlockUtils-Add-metadata-fixing-in-SplitBlockPre.patch +++ /dev/null | |||
| @@ -1,111 +0,0 @@ | |||
| 1 | From eeb816d95f0910bd246e37bb2bb3923acf0edf6b Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Aleksander Us <aleksander.us@intel.com> | ||
| 3 | Date: Mon, 26 Aug 2019 15:47:41 +0300 | ||
| 4 | Subject: [PATCH] [BasicBlockUtils] Add metadata fixing in | ||
| 5 | SplitBlockPredecessors. | ||
| 6 | |||
| 7 | In case when BB is header of some loop and predecessor is latch of | ||
| 8 | this loop, metadata was not attached to newly created basic block. | ||
| 9 | This led to loss of loop metadata for other passes. | ||
| 10 | |||
| 11 | Upstream-Status: Submitted [https://reviews.llvm.org/D66892] | ||
| 12 | |||
| 13 | https://github.com/intel/llvm-patches/commit/8af4449e2d201707f7f2f832b473a0439e255f32 | ||
| 14 | |||
| 15 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 16 | --- | ||
| 17 | lib/Transforms/Utils/BasicBlockUtils.cpp | 23 ++++++++---- | ||
| 18 | test/Transforms/LoopSimplify/loop_metadata.ll | 36 +++++++++++++++++++ | ||
| 19 | 2 files changed, 52 insertions(+), 7 deletions(-) | ||
| 20 | create mode 100644 test/Transforms/LoopSimplify/loop_metadata.ll | ||
| 21 | |||
| 22 | diff --git a/lib/Transforms/Utils/BasicBlockUtils.cpp b/lib/Transforms/Utils/BasicBlockUtils.cpp | ||
| 23 | index 5fa371377c8..3a90ae061fb 100644 | ||
| 24 | --- a/lib/Transforms/Utils/BasicBlockUtils.cpp | ||
| 25 | +++ b/lib/Transforms/Utils/BasicBlockUtils.cpp | ||
| 26 | @@ -579,24 +579,33 @@ BasicBlock *llvm::SplitBlockPredecessors(BasicBlock *BB, | ||
| 27 | |||
| 28 | // The new block unconditionally branches to the old block. | ||
| 29 | BranchInst *BI = BranchInst::Create(BB, NewBB); | ||
| 30 | + bool IsBBHeader = LI && LI->isLoopHeader(BB); | ||
| 31 | + Loop *BBLoop = LI ? LI->getLoopFor(BB) : nullptr; | ||
| 32 | // Splitting the predecessors of a loop header creates a preheader block. | ||
| 33 | - if (LI && LI->isLoopHeader(BB)) | ||
| 34 | + if (IsBBHeader) | ||
| 35 | // Using the loop start line number prevents debuggers stepping into the | ||
| 36 | // loop body for this instruction. | ||
| 37 | - BI->setDebugLoc(LI->getLoopFor(BB)->getStartLoc()); | ||
| 38 | + BI->setDebugLoc(BBLoop->getStartLoc()); | ||
| 39 | else | ||
| 40 | BI->setDebugLoc(BB->getFirstNonPHIOrDbg()->getDebugLoc()); | ||
| 41 | |||
| 42 | // Move the edges from Preds to point to NewBB instead of BB. | ||
| 43 | - for (unsigned i = 0, e = Preds.size(); i != e; ++i) { | ||
| 44 | + for (BasicBlock *Pred : Preds) { | ||
| 45 | + Instruction *PI = Pred->getTerminator(); | ||
| 46 | // This is slightly more strict than necessary; the minimum requirement | ||
| 47 | // is that there be no more than one indirectbr branching to BB. And | ||
| 48 | // all BlockAddress uses would need to be updated. | ||
| 49 | - assert(!isa<IndirectBrInst>(Preds[i]->getTerminator()) && | ||
| 50 | + assert(!isa<IndirectBrInst>(PI) && | ||
| 51 | "Cannot split an edge from an IndirectBrInst"); | ||
| 52 | - assert(!isa<CallBrInst>(Preds[i]->getTerminator()) && | ||
| 53 | - "Cannot split an edge from a CallBrInst"); | ||
| 54 | - Preds[i]->getTerminator()->replaceUsesOfWith(BB, NewBB); | ||
| 55 | + assert(!isa<CallBrInst>(PI) && "Cannot split an edge from a CallBrInst"); | ||
| 56 | + if (IsBBHeader && BBLoop->contains(Pred) && BBLoop->isLoopLatch(Pred)) { | ||
| 57 | + // Update loop metadata if it exists. | ||
| 58 | + if (MDNode *LoopMD = PI->getMetadata(LLVMContext::MD_loop)) { | ||
| 59 | + BI->setMetadata(LLVMContext::MD_loop, LoopMD); | ||
| 60 | + PI->setMetadata(LLVMContext::MD_loop, nullptr); | ||
| 61 | + } | ||
| 62 | + } | ||
| 63 | + PI->replaceUsesOfWith(BB, NewBB); | ||
| 64 | } | ||
| 65 | |||
| 66 | // Insert a new PHI node into NewBB for every PHI node in BB and that new PHI | ||
| 67 | diff --git a/test/Transforms/LoopSimplify/loop_metadata.ll b/test/Transforms/LoopSimplify/loop_metadata.ll | ||
| 68 | new file mode 100644 | ||
| 69 | index 00000000000..c15c92fe3ae | ||
| 70 | --- /dev/null | ||
| 71 | +++ b/test/Transforms/LoopSimplify/loop_metadata.ll | ||
| 72 | @@ -0,0 +1,36 @@ | ||
| 73 | +; RUN: opt -S -loop-simplify < %s | FileCheck %s | ||
| 74 | + | ||
| 75 | +; CHECK: for.cond.loopexit: | ||
| 76 | +; CHECK: br label %for.cond, !llvm.loop !0 | ||
| 77 | +; CHECK: br i1 %cmp1, label %for.body1, label %for.cond.loopexit | ||
| 78 | + | ||
| 79 | +define void @foo() { | ||
| 80 | +entry: | ||
| 81 | + br label %for.cond | ||
| 82 | + | ||
| 83 | +for.cond: ; preds = %for.cond1, %entry | ||
| 84 | + %j = phi i32 [ 0, %entry ], [ %add, %for.cond1 ] | ||
| 85 | + %cmp = icmp ult i32 %j, 8 | ||
| 86 | + br i1 %cmp, label %for.body, label %for.end | ||
| 87 | + | ||
| 88 | +for.body: ; preds = %for.cond | ||
| 89 | + %dummy1 = add i32 1, 1 | ||
| 90 | + %add = add nuw nsw i32 %j, 1 | ||
| 91 | + br label %for.cond1 | ||
| 92 | + | ||
| 93 | +for.cond1: ; preds = %for.body1, %for.body | ||
| 94 | + %i.0 = phi i32 [ 1, %for.body ], [ %inc, %for.body1 ] | ||
| 95 | + %cmp1 = icmp ult i32 %i.0, 8 | ||
| 96 | + br i1 %cmp1, label %for.body1, label %for.cond, !llvm.loop !0 | ||
| 97 | + | ||
| 98 | +for.body1: ; preds = %for.cond1 | ||
| 99 | + %dummy2 = add i32 1, 1 | ||
| 100 | + %inc = add nuw nsw i32 %i.0, 1 | ||
| 101 | + br label %for.cond1 | ||
| 102 | + | ||
| 103 | +for.end: ; preds = %for.cond | ||
| 104 | + ret void | ||
| 105 | +} | ||
| 106 | + | ||
| 107 | +!0 = distinct !{!0, !1} | ||
| 108 | +!1 = !{!"llvm.loop.unroll.full"} | ||
| 109 | -- | ||
| 110 | 2.18.0 | ||
| 111 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/IndVarSimplify-Do-not-use-SCEV-expander-for-IVCount-.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/IndVarSimplify-Do-not-use-SCEV-expander-for-IVCount-.patch deleted file mode 100644 index 48307deb..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/IndVarSimplify-Do-not-use-SCEV-expander-for-IVCount-.patch +++ /dev/null | |||
| @@ -1,146 +0,0 @@ | |||
| 1 | From 35e218a886f4c066eabd18685240d55270bd5a6d Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Aleksander Us <aleksander.us@intel.com> | ||
| 3 | Date: Mon, 26 Aug 2019 15:45:47 +0300 | ||
| 4 | Subject: [PATCH] [IndVarSimplify] Do not use SCEV expander for IVCount in | ||
| 5 | LFTR when possible. | ||
| 6 | |||
| 7 | SCEV analysis cannot properly cache instruction with poison flags | ||
| 8 | (for example, add nsw outside of loop will not be reused by expander). | ||
| 9 | This can lead to generating of additional instructions by SCEV expander. | ||
| 10 | |||
| 11 | Example IR: | ||
| 12 | |||
| 13 | ... | ||
| 14 | %maxval = add nuw nsw i32 %a1, %a2 | ||
| 15 | ... | ||
| 16 | for.body: | ||
| 17 | ... | ||
| 18 | %cmp22 = icmp ult i32 %ivadd, %maxval | ||
| 19 | br i1 %cmp22, label %for.body, label %for.end | ||
| 20 | ... | ||
| 21 | |||
| 22 | SCEV expander will generate copy of %maxval in preheader but without | ||
| 23 | nuw/nsw flags. This can be avoided by explicit check that iv count | ||
| 24 | value gives the same SCEV expressions as calculated by LFTR. | ||
| 25 | |||
| 26 | Upstream-Status: Submitted [https://reviews.llvm.org/D66890] | ||
| 27 | |||
| 28 | https://github.com/intel/llvm-patches/commit/fd6a6c97341a56fd21bc32bc940afea751312e8f | ||
| 29 | |||
| 30 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 31 | --- | ||
| 32 | lib/Transforms/Scalar/IndVarSimplify.cpp | 12 +++++++++- | ||
| 33 | test/Transforms/IndVarSimplify/add_nsw.ll | 23 ++++++++++++++++++++ | ||
| 34 | test/Transforms/IndVarSimplify/lftr-reuse.ll | 9 +++----- | ||
| 35 | test/Transforms/IndVarSimplify/udiv.ll | 1 + | ||
| 36 | 4 files changed, 38 insertions(+), 7 deletions(-) | ||
| 37 | create mode 100644 test/Transforms/IndVarSimplify/add_nsw.ll | ||
| 38 | |||
| 39 | diff --git a/lib/Transforms/Scalar/IndVarSimplify.cpp b/lib/Transforms/Scalar/IndVarSimplify.cpp | ||
| 40 | index f9fc698a4a9..5e04dac8aa6 100644 | ||
| 41 | --- a/lib/Transforms/Scalar/IndVarSimplify.cpp | ||
| 42 | +++ b/lib/Transforms/Scalar/IndVarSimplify.cpp | ||
| 43 | @@ -2375,6 +2375,17 @@ static Value *genLoopLimit(PHINode *IndVar, BasicBlock *ExitingBB, | ||
| 44 | if (UsePostInc) | ||
| 45 | IVLimit = SE->getAddExpr(IVLimit, SE->getOne(IVLimit->getType())); | ||
| 46 | |||
| 47 | + // If computed limit is equal to old limit then do not use SCEV expander | ||
| 48 | + // because it can lost NUW/NSW flags and create extra instructions. | ||
| 49 | + BranchInst *BI = cast<BranchInst>(ExitingBB->getTerminator()); | ||
| 50 | + if (ICmpInst *Cmp = dyn_cast<ICmpInst>(BI->getOperand(0))) { | ||
| 51 | + Value *Limit = Cmp->getOperand(0); | ||
| 52 | + if (!L->isLoopInvariant(Limit)) | ||
| 53 | + Limit = Cmp->getOperand(1); | ||
| 54 | + if (SE->getSCEV(Limit) == IVLimit) | ||
| 55 | + return Limit; | ||
| 56 | + } | ||
| 57 | + | ||
| 58 | // Expand the code for the iteration count. | ||
| 59 | assert(SE->isLoopInvariant(IVLimit, L) && | ||
| 60 | "Computed iteration count is not loop invariant!"); | ||
| 61 | @@ -2383,7 +2394,6 @@ static Value *genLoopLimit(PHINode *IndVar, BasicBlock *ExitingBB, | ||
| 62 | // SCEV expression (IVInit) for a pointer type IV value (IndVar). | ||
| 63 | Type *LimitTy = ExitCount->getType()->isPointerTy() ? | ||
| 64 | IndVar->getType() : ExitCount->getType(); | ||
| 65 | - BranchInst *BI = cast<BranchInst>(ExitingBB->getTerminator()); | ||
| 66 | return Rewriter.expandCodeFor(IVLimit, LimitTy, BI); | ||
| 67 | } | ||
| 68 | } | ||
| 69 | diff --git a/test/Transforms/IndVarSimplify/add_nsw.ll b/test/Transforms/IndVarSimplify/add_nsw.ll | ||
| 70 | new file mode 100644 | ||
| 71 | index 00000000000..abd1cbb6c51 | ||
| 72 | --- /dev/null | ||
| 73 | +++ b/test/Transforms/IndVarSimplify/add_nsw.ll | ||
| 74 | @@ -0,0 +1,23 @@ | ||
| 75 | +; RUN: opt -indvars -S %s | FileCheck %s | ||
| 76 | + | ||
| 77 | +target datalayout = "e-p:32:32-i64:64-n8:16:32" | ||
| 78 | + | ||
| 79 | +; CHECK: for.body.preheader: | ||
| 80 | +; CHECK-NOT: add | ||
| 81 | +; CHECK: for.body: | ||
| 82 | + | ||
| 83 | +define void @foo(i32 %a1, i32 %a2) { | ||
| 84 | +entry: | ||
| 85 | + %maxval = add nuw nsw i32 %a1, %a2 | ||
| 86 | + %cmp = icmp slt i32 %maxval, 1 | ||
| 87 | + br i1 %cmp, label %for.end, label %for.body | ||
| 88 | + | ||
| 89 | +for.body: ; preds = %entry, %for.body | ||
| 90 | + %j.02 = phi i32 [ 0, %entry ], [ %add31, %for.body ] | ||
| 91 | + %add31 = add nuw nsw i32 %j.02, 1 | ||
| 92 | + %cmp22 = icmp slt i32 %add31, %maxval | ||
| 93 | + br i1 %cmp22, label %for.body, label %for.end | ||
| 94 | + | ||
| 95 | +for.end: ; preds = %for.body | ||
| 96 | + ret void | ||
| 97 | +} | ||
| 98 | diff --git a/test/Transforms/IndVarSimplify/lftr-reuse.ll b/test/Transforms/IndVarSimplify/lftr-reuse.ll | ||
| 99 | index 14ae9738696..509d662b767 100644 | ||
| 100 | --- a/test/Transforms/IndVarSimplify/lftr-reuse.ll | ||
| 101 | +++ b/test/Transforms/IndVarSimplify/lftr-reuse.ll | ||
| 102 | @@ -67,11 +67,9 @@ define void @expandOuterRecurrence(i32 %arg) nounwind { | ||
| 103 | ; CHECK-NEXT: [[CMP1:%.*]] = icmp slt i32 0, [[SUB1]] | ||
| 104 | ; CHECK-NEXT: br i1 [[CMP1]], label [[OUTER_PREHEADER:%.*]], label [[EXIT:%.*]] | ||
| 105 | ; CHECK: outer.preheader: | ||
| 106 | -; CHECK-NEXT: [[TMP0:%.*]] = add i32 [[ARG]], -1 | ||
| 107 | ; CHECK-NEXT: br label [[OUTER:%.*]] | ||
| 108 | ; CHECK: outer: | ||
| 109 | -; CHECK-NEXT: [[INDVARS_IV:%.*]] = phi i32 [ [[TMP0]], [[OUTER_PREHEADER]] ], [ [[INDVARS_IV_NEXT:%.*]], [[OUTER_INC:%.*]] ] | ||
| 110 | -; CHECK-NEXT: [[I:%.*]] = phi i32 [ [[I_INC:%.*]], [[OUTER_INC]] ], [ 0, [[OUTER_PREHEADER]] ] | ||
| 111 | +; CHECK-NEXT: [[I:%.*]] = phi i32 [ [[I_INC:%.*]], [[OUTER_INC:%.*]] ], [ 0, [[OUTER_PREHEADER]] ] | ||
| 112 | ; CHECK-NEXT: [[SUB2:%.*]] = sub nsw i32 [[ARG]], [[I]] | ||
| 113 | ; CHECK-NEXT: [[SUB3:%.*]] = sub nsw i32 [[SUB2]], 1 | ||
| 114 | ; CHECK-NEXT: [[CMP2:%.*]] = icmp slt i32 0, [[SUB3]] | ||
| 115 | @@ -81,14 +79,13 @@ define void @expandOuterRecurrence(i32 %arg) nounwind { | ||
| 116 | ; CHECK: inner: | ||
| 117 | ; CHECK-NEXT: [[J:%.*]] = phi i32 [ 0, [[INNER_PH]] ], [ [[J_INC:%.*]], [[INNER]] ] | ||
| 118 | ; CHECK-NEXT: [[J_INC]] = add nuw nsw i32 [[J]], 1 | ||
| 119 | -; CHECK-NEXT: [[EXITCOND:%.*]] = icmp ne i32 [[J_INC]], [[INDVARS_IV]] | ||
| 120 | +; CHECK-NEXT: [[EXITCOND:%.*]] = icmp ne i32 [[J_INC]], [[SUB3]] | ||
| 121 | ; CHECK-NEXT: br i1 [[EXITCOND]], label [[INNER]], label [[OUTER_INC_LOOPEXIT:%.*]] | ||
| 122 | ; CHECK: outer.inc.loopexit: | ||
| 123 | ; CHECK-NEXT: br label [[OUTER_INC]] | ||
| 124 | ; CHECK: outer.inc: | ||
| 125 | ; CHECK-NEXT: [[I_INC]] = add nuw nsw i32 [[I]], 1 | ||
| 126 | -; CHECK-NEXT: [[INDVARS_IV_NEXT]] = add i32 [[INDVARS_IV]], -1 | ||
| 127 | -; CHECK-NEXT: [[EXITCOND1:%.*]] = icmp ne i32 [[I_INC]], [[TMP0]] | ||
| 128 | +; CHECK-NEXT: [[EXITCOND1:%.*]] = icmp ne i32 [[I_INC]], [[SUB1]] | ||
| 129 | ; CHECK-NEXT: br i1 [[EXITCOND1]], label [[OUTER]], label [[EXIT_LOOPEXIT:%.*]] | ||
| 130 | ; CHECK: exit.loopexit: | ||
| 131 | ; CHECK-NEXT: br label [[EXIT]] | ||
| 132 | diff --git a/test/Transforms/IndVarSimplify/udiv.ll b/test/Transforms/IndVarSimplify/udiv.ll | ||
| 133 | index b3f2c2a6a66..3530343ef4a 100644 | ||
| 134 | --- a/test/Transforms/IndVarSimplify/udiv.ll | ||
| 135 | +++ b/test/Transforms/IndVarSimplify/udiv.ll | ||
| 136 | @@ -133,6 +133,7 @@ declare i32 @printf(i8* nocapture, ...) nounwind | ||
| 137 | ; CHECK-LABEL: @foo( | ||
| 138 | ; CHECK: for.body.preheader: | ||
| 139 | ; CHECK-NOT: udiv | ||
| 140 | +; CHECK: for.body: | ||
| 141 | |||
| 142 | define void @foo(double* %p, i64 %n) nounwind { | ||
| 143 | entry: | ||
| 144 | -- | ||
| 145 | 2.18.0 | ||
| 146 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/fix-shared-libs.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/fix-shared-libs.patch deleted file mode 100644 index d69d2a97..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/fix-shared-libs.patch +++ /dev/null | |||
| @@ -1,30 +0,0 @@ | |||
| 1 | From a6d4ccf082858e63e139ca06c02a071c343d2657 Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Andrea Bocci <andrea.bocci@cern.ch> | ||
| 3 | Date: Sun, 15 Mar 2020 17:35:44 +0100 | ||
| 4 | Subject: [PATCH] Fix building in-tree with cmake -DLLVM_LINK_LLVM_DYLIB=ON | ||
| 5 | |||
| 6 | Building in-tree with LLVM 11.0 master with the LLVM_LINK_LLVM_DYLIB | ||
| 7 | cmake flag fails to link with the LLVMSPIRVLib library. | ||
| 8 | |||
| 9 | Add an explicit dependency to force the correct build order and linking. | ||
| 10 | |||
| 11 | Signed-off-by: Andrea Bocci <andrea.bocci@cern.ch> | ||
| 12 | Upstream-Status: Backport | ||
| 13 | Signed-off-by: Anuj Mittal <anuj.mittal@intel.com> | ||
| 14 | --- | ||
| 15 | tools/llvm-spirv/CMakeLists.txt | 2 +- | ||
| 16 | 1 file changed, 1 insertion(+), 1 deletion(-) | ||
| 17 | |||
| 18 | diff --git a/tools/llvm-spirv/CMakeLists.txt b/tools/llvm-spirv/CMakeLists.txt | ||
| 19 | index 9aa96d9c..501c0daf 100644 | ||
| 20 | --- a/tools/llvm-spirv/CMakeLists.txt | ||
| 21 | +++ b/tools/llvm-spirv/CMakeLists.txt | ||
| 22 | @@ -14,7 +14,7 @@ add_llvm_tool(llvm-spirv | ||
| 23 | NO_INSTALL_RPATH | ||
| 24 | ) | ||
| 25 | |||
| 26 | -if (LLVM_SPIRV_BUILD_EXTERNAL) | ||
| 27 | +if (LLVM_SPIRV_BUILD_EXTERNAL OR LLVM_LINK_LLVM_DYLIB) | ||
| 28 | target_link_libraries(llvm-spirv PRIVATE LLVMSPIRVLib) | ||
| 29 | endif() | ||
| 30 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-OpenCL-3.0-support.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-OpenCL-3.0-support.patch deleted file mode 100644 index 53395ea0..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-OpenCL-3.0-support.patch +++ /dev/null | |||
| @@ -1,8259 +0,0 @@ | |||
| 1 | From 31ec702cb365f4d02dd2146fb4329d642b8fc30b Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 3 | Date: Wed, 7 Apr 2021 16:36:10 +0800 | ||
| 4 | Subject: [PATCH 1/2] OpenCL 3.0 support | ||
| 5 | |||
| 6 | Upstream-Status: Backport [Taken from opencl-clang patches, https://github.com/intel/opencl-clang/blob/ocl-open-100/patches/clang/0001-OpenCL-3.0-support.patch] | ||
| 7 | Signed-off-by: Anton Zabaznov <anton.zabaznov@intel.com> | ||
| 8 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 9 | --- | ||
| 10 | clang/include/clang/Basic/Builtins.def | 65 +- | ||
| 11 | clang/include/clang/Basic/Builtins.h | 13 +- | ||
| 12 | .../clang/Basic/DiagnosticParseKinds.td | 2 + | ||
| 13 | .../clang/Basic/DiagnosticSemaKinds.td | 7 + | ||
| 14 | clang/include/clang/Basic/LangOptions.def | 2 + | ||
| 15 | clang/include/clang/Basic/LangStandards.def | 4 + | ||
| 16 | .../include/clang/Basic/OpenCLExtensions.def | 15 + | ||
| 17 | clang/include/clang/Basic/OpenCLOptions.h | 175 +- | ||
| 18 | clang/include/clang/Driver/Options.td | 2 +- | ||
| 19 | clang/include/clang/Sema/Sema.h | 9 + | ||
| 20 | clang/lib/AST/ASTContext.cpp | 3 +- | ||
| 21 | clang/lib/Basic/Builtins.cpp | 28 +- | ||
| 22 | clang/lib/Basic/TargetInfo.cpp | 11 + | ||
| 23 | clang/lib/Basic/Targets.cpp | 1 - | ||
| 24 | clang/lib/CodeGen/CodeGenFunction.cpp | 6 +- | ||
| 25 | clang/lib/Frontend/CompilerInvocation.cpp | 22 +- | ||
| 26 | clang/lib/Frontend/InitPreprocessor.cpp | 6 +- | ||
| 27 | clang/lib/Headers/opencl-c-base.h | 75 +- | ||
| 28 | clang/lib/Headers/opencl-c.h | 3228 ++++++++++++++--- | ||
| 29 | clang/lib/Parse/ParseDecl.cpp | 12 +- | ||
| 30 | clang/lib/Parse/ParsePragma.cpp | 10 +- | ||
| 31 | clang/lib/Sema/OpenCLBuiltins.td | 49 +- | ||
| 32 | clang/lib/Sema/Sema.cpp | 47 +- | ||
| 33 | clang/lib/Sema/SemaChecking.cpp | 38 +- | ||
| 34 | clang/lib/Sema/SemaDecl.cpp | 15 +- | ||
| 35 | clang/lib/Sema/SemaDeclAttr.cpp | 9 +- | ||
| 36 | clang/lib/Sema/SemaDeclCXX.cpp | 10 + | ||
| 37 | clang/lib/Sema/SemaLookup.cpp | 19 +- | ||
| 38 | clang/lib/Sema/SemaType.cpp | 14 +- | ||
| 39 | .../CodeGenOpenCL/addr-space-struct-arg.cl | 7 +- | ||
| 40 | .../address-spaces-conversions.cl | 2 + | ||
| 41 | .../CodeGenOpenCL/address-spaces-mangling.cl | 3 +- | ||
| 42 | clang/test/CodeGenOpenCL/address-spaces.cl | 4 + | ||
| 43 | .../amdgcn-automatic-variable.cl | 1 + | ||
| 44 | .../CodeGenOpenCL/amdgpu-sizeof-alignof.cl | 21 +- | ||
| 45 | .../CodeGenOpenCL/arm-integer-dot-product.cl | 1 + | ||
| 46 | .../test/CodeGenOpenCL/cl-uniform-wg-size.cl | 2 + | ||
| 47 | clang/test/CodeGenOpenCL/fpmath.cl | 2 + | ||
| 48 | .../generic-address-space-feature.cl | 28 + | ||
| 49 | .../intel-subgroups-avc-ext-types.cl | 1 + | ||
| 50 | .../kernels-have-spir-cc-by-default.cl | 3 + | ||
| 51 | clang/test/CodeGenOpenCL/logical-ops.cl | 1 + | ||
| 52 | clang/test/CodeGenOpenCL/no-half.cl | 1 + | ||
| 53 | clang/test/CodeGenOpenCL/pipe_builtin.cl | 3 + | ||
| 54 | clang/test/CodeGenOpenCL/pipe_types.cl | 1 + | ||
| 55 | clang/test/CodeGenOpenCL/printf.cl | 2 + | ||
| 56 | clang/test/CodeGenOpenCL/unroll-hint.cl | 1 + | ||
| 57 | clang/test/Driver/autocomplete.c | 2 + | ||
| 58 | clang/test/Driver/opencl.cl | 2 + | ||
| 59 | clang/test/Driver/unknown-std.cl | 1 + | ||
| 60 | clang/test/Frontend/stdlang.c | 1 + | ||
| 61 | clang/test/Headers/opencl-c-header.cl | 7 +- | ||
| 62 | clang/test/Index/pipe-size.cl | 7 + | ||
| 63 | clang/test/Preprocessor/predefined-macros.c | 13 + | ||
| 64 | .../Sema/feature-extensions-simult-support.cl | 75 + | ||
| 65 | clang/test/Sema/features-ignore-pragma.cl | 24 + | ||
| 66 | clang/test/Sema/opencl-features-pipes.cl | 18 + | ||
| 67 | clang/test/Sema/opencl-features.cl | 128 + | ||
| 68 | clang/test/Sema/pipe_builtins_feature.cl | 21 + | ||
| 69 | .../address-spaces-conversions-cl2.0.cl | 3 + | ||
| 70 | clang/test/SemaOpenCL/address-spaces.cl | 1 + | ||
| 71 | .../SemaOpenCL/cl20-device-side-enqueue.cl | 16 +- | ||
| 72 | .../SemaOpenCL/forget-unsupported-builtins.cl | 22 + | ||
| 73 | clang/test/SemaOpenCL/image-features.cl | 20 + | ||
| 74 | .../SemaOpenCL/invalid-pipe-builtin-cl2.0.cl | 1 + | ||
| 75 | clang/test/SemaOpenCL/storageclass-cl20.cl | 1 + | ||
| 76 | .../TableGen/ClangOpenCLBuiltinEmitter.cpp | 35 +- | ||
| 77 | 67 files changed, 3656 insertions(+), 723 deletions(-) | ||
| 78 | create mode 100644 clang/test/CodeGenOpenCL/generic-address-space-feature.cl | ||
| 79 | create mode 100644 clang/test/Sema/feature-extensions-simult-support.cl | ||
| 80 | create mode 100644 clang/test/Sema/features-ignore-pragma.cl | ||
| 81 | create mode 100644 clang/test/Sema/opencl-features-pipes.cl | ||
| 82 | create mode 100644 clang/test/Sema/opencl-features.cl | ||
| 83 | create mode 100644 clang/test/Sema/pipe_builtins_feature.cl | ||
| 84 | create mode 100644 clang/test/SemaOpenCL/forget-unsupported-builtins.cl | ||
| 85 | create mode 100644 clang/test/SemaOpenCL/image-features.cl | ||
| 86 | |||
| 87 | diff --git a/clang/include/clang/Basic/Builtins.def b/clang/include/clang/Basic/Builtins.def | ||
| 88 | index 1a6c85ce2dd3..b76e277f0337 100644 | ||
| 89 | --- a/clang/include/clang/Basic/Builtins.def | ||
| 90 | +++ b/clang/include/clang/Basic/Builtins.def | ||
| 91 | @@ -106,6 +106,10 @@ | ||
| 92 | # define LANGBUILTIN(ID, TYPE, ATTRS, BUILTIN_LANG) BUILTIN(ID, TYPE, ATTRS) | ||
| 93 | #endif | ||
| 94 | |||
| 95 | +#if defined(BUILTIN) && !defined(OPENCLBUILTIN) | ||
| 96 | +# define OPENCLBUILTIN(ID, TYPE, ATTRS, BUILTIN_LANG, FEATURE) BUILTIN(ID, TYPE, ATTRS) | ||
| 97 | +#endif | ||
| 98 | + | ||
| 99 | // Standard libc/libm functions: | ||
| 100 | BUILTIN(__builtin_atan2 , "ddd" , "Fne") | ||
| 101 | BUILTIN(__builtin_atan2f, "fff" , "Fne") | ||
| 102 | @@ -1514,50 +1518,54 @@ BUILTIN(__builtin_coro_param, "bv*v*", "n") | ||
| 103 | |||
| 104 | // OpenCL v2.0 s6.13.16, s9.17.3.5 - Pipe functions. | ||
| 105 | // We need the generic prototype, since the packet type could be anything. | ||
| 106 | -LANGBUILTIN(read_pipe, "i.", "tn", OCLC20_LANG) | ||
| 107 | -LANGBUILTIN(write_pipe, "i.", "tn", OCLC20_LANG) | ||
| 108 | +OPENCLBUILTIN(read_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 109 | +OPENCLBUILTIN(write_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 110 | |||
| 111 | -LANGBUILTIN(reserve_read_pipe, "i.", "tn", OCLC20_LANG) | ||
| 112 | -LANGBUILTIN(reserve_write_pipe, "i.", "tn", OCLC20_LANG) | ||
| 113 | +OPENCLBUILTIN(reserve_read_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 114 | +OPENCLBUILTIN(reserve_write_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 115 | |||
| 116 | -LANGBUILTIN(commit_write_pipe, "v.", "tn", OCLC20_LANG) | ||
| 117 | -LANGBUILTIN(commit_read_pipe, "v.", "tn", OCLC20_LANG) | ||
| 118 | +OPENCLBUILTIN(commit_write_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 119 | +OPENCLBUILTIN(commit_read_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 120 | |||
| 121 | -LANGBUILTIN(sub_group_reserve_read_pipe, "i.", "tn", OCLC20_LANG) | ||
| 122 | -LANGBUILTIN(sub_group_reserve_write_pipe, "i.", "tn", OCLC20_LANG) | ||
| 123 | +OPENCLBUILTIN(sub_group_reserve_read_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 124 | +OPENCLBUILTIN(sub_group_reserve_write_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 125 | |||
| 126 | -LANGBUILTIN(sub_group_commit_read_pipe, "v.", "tn", OCLC20_LANG) | ||
| 127 | -LANGBUILTIN(sub_group_commit_write_pipe, "v.", "tn", OCLC20_LANG) | ||
| 128 | +OPENCLBUILTIN(sub_group_commit_read_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 129 | +OPENCLBUILTIN(sub_group_commit_write_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 130 | |||
| 131 | -LANGBUILTIN(work_group_reserve_read_pipe, "i.", "tn", OCLC20_LANG) | ||
| 132 | -LANGBUILTIN(work_group_reserve_write_pipe, "i.", "tn", OCLC20_LANG) | ||
| 133 | +OPENCLBUILTIN(work_group_reserve_read_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 134 | +OPENCLBUILTIN(work_group_reserve_write_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 135 | |||
| 136 | -LANGBUILTIN(work_group_commit_read_pipe, "v.", "tn", OCLC20_LANG) | ||
| 137 | -LANGBUILTIN(work_group_commit_write_pipe, "v.", "tn", OCLC20_LANG) | ||
| 138 | +OPENCLBUILTIN(work_group_commit_read_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 139 | +OPENCLBUILTIN(work_group_commit_write_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 140 | |||
| 141 | -LANGBUILTIN(get_pipe_num_packets, "Ui.", "tn", OCLC20_LANG) | ||
| 142 | -LANGBUILTIN(get_pipe_max_packets, "Ui.", "tn", OCLC20_LANG) | ||
| 143 | +OPENCLBUILTIN(get_pipe_num_packets, "Ui.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 144 | +OPENCLBUILTIN(get_pipe_max_packets, "Ui.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 145 | |||
| 146 | // OpenCL v2.0 s6.13.17 - Enqueue kernel functions. | ||
| 147 | // Custom builtin check allows to perform special check of passed block arguments. | ||
| 148 | -LANGBUILTIN(enqueue_kernel, "i.", "tn", OCLC20_LANG) | ||
| 149 | -LANGBUILTIN(get_kernel_work_group_size, "Ui.", "tn", OCLC20_LANG) | ||
| 150 | -LANGBUILTIN(get_kernel_preferred_work_group_size_multiple, "Ui.", "tn", OCLC20_LANG) | ||
| 151 | -LANGBUILTIN(get_kernel_max_sub_group_size_for_ndrange, "Ui.", "tn", OCLC20_LANG) | ||
| 152 | -LANGBUILTIN(get_kernel_sub_group_count_for_ndrange, "Ui.", "tn", OCLC20_LANG) | ||
| 153 | +OPENCLBUILTIN(enqueue_kernel, "i.", "tn", OCLC2P_LANG, | ||
| 154 | + "__opencl_c_device_enqueue") | ||
| 155 | +OPENCLBUILTIN(get_kernel_work_group_size, "Ui.", "tn", OCLC2P_LANG, | ||
| 156 | + "__opencl_c_device_enqueue") | ||
| 157 | +OPENCLBUILTIN(get_kernel_preferred_work_group_size_multiple, "Ui.", "tn", | ||
| 158 | + OCLC2P_LANG, "__opencl_c_device_enqueue") | ||
| 159 | +OPENCLBUILTIN(get_kernel_max_sub_group_size_for_ndrange, "Ui.", "tn", | ||
| 160 | + OCLC2P_LANG, "__opencl_c_device_enqueue") | ||
| 161 | +OPENCLBUILTIN(get_kernel_sub_group_count_for_ndrange, "Ui.", "tn", OCLC2P_LANG, "__opencl_c_device_enqueue") | ||
| 162 | |||
| 163 | // OpenCL v2.0 s6.13.9 - Address space qualifier functions. | ||
| 164 | // FIXME: Pointer parameters of OpenCL builtins should have their address space | ||
| 165 | // requirement defined. | ||
| 166 | -LANGBUILTIN(to_global, "v*v*", "tn", OCLC20_LANG) | ||
| 167 | -LANGBUILTIN(to_local, "v*v*", "tn", OCLC20_LANG) | ||
| 168 | -LANGBUILTIN(to_private, "v*v*", "tn", OCLC20_LANG) | ||
| 169 | +OPENCLBUILTIN(to_global, "v*v*", "tn", OCLC2P_LANG, "__opencl_c_generic_address_space") | ||
| 170 | +OPENCLBUILTIN(to_local, "v*v*", "tn", OCLC2P_LANG, "__opencl_c_generic_address_space") | ||
| 171 | +OPENCLBUILTIN(to_private, "v*v*", "tn", OCLC2P_LANG, "__opencl_c_generic_address_space") | ||
| 172 | |||
| 173 | // OpenCL half load/store builtin | ||
| 174 | -LANGBUILTIN(__builtin_store_half, "vdh*", "n", ALL_OCLC_LANGUAGES) | ||
| 175 | -LANGBUILTIN(__builtin_store_halff, "vfh*", "n", ALL_OCLC_LANGUAGES) | ||
| 176 | -LANGBUILTIN(__builtin_load_half, "dhC*", "nc", ALL_OCLC_LANGUAGES) | ||
| 177 | -LANGBUILTIN(__builtin_load_halff, "fhC*", "nc", ALL_OCLC_LANGUAGES) | ||
| 178 | +OPENCLBUILTIN(__builtin_store_half, "vdh*", "n", ALL_OCLC_LANGUAGES, "") | ||
| 179 | +OPENCLBUILTIN(__builtin_store_halff, "vfh*", "n", ALL_OCLC_LANGUAGES, "") | ||
| 180 | +OPENCLBUILTIN(__builtin_load_half, "dhC*", "nc", ALL_OCLC_LANGUAGES, "") | ||
| 181 | +OPENCLBUILTIN(__builtin_load_halff, "fhC*", "nc", ALL_OCLC_LANGUAGES, "") | ||
| 182 | |||
| 183 | // Builtins for os_log/os_trace | ||
| 184 | BUILTIN(__builtin_os_log_format_buffer_size, "zcC*.", "p:0:nut") | ||
| 185 | @@ -1578,3 +1586,4 @@ BUILTIN(__builtin_ms_va_copy, "vc*&c*&", "n") | ||
| 186 | #undef BUILTIN | ||
| 187 | #undef LIBBUILTIN | ||
| 188 | #undef LANGBUILTIN | ||
| 189 | +#undef OPENCLBUILTIN | ||
| 190 | diff --git a/clang/include/clang/Basic/Builtins.h b/clang/include/clang/Basic/Builtins.h | ||
| 191 | index e4ed482d9068..713ea4bc267d 100644 | ||
| 192 | --- a/clang/include/clang/Basic/Builtins.h | ||
| 193 | +++ b/clang/include/clang/Basic/Builtins.h | ||
| 194 | @@ -33,13 +33,13 @@ enum LanguageID { | ||
| 195 | CXX_LANG = 0x4, // builtin for cplusplus only. | ||
| 196 | OBJC_LANG = 0x8, // builtin for objective-c and objective-c++ | ||
| 197 | MS_LANG = 0x10, // builtin requires MS mode. | ||
| 198 | - OCLC20_LANG = 0x20, // builtin for OpenCL C 2.0 only. | ||
| 199 | + OCLC2P_LANG = 0x20, // builtin for OpenCL C 2.0+ versions. | ||
| 200 | OCLC1X_LANG = 0x40, // builtin for OpenCL C 1.x only. | ||
| 201 | OMP_LANG = 0x80, // builtin requires OpenMP. | ||
| 202 | ALL_LANGUAGES = C_LANG | CXX_LANG | OBJC_LANG, // builtin for all languages. | ||
| 203 | ALL_GNU_LANGUAGES = ALL_LANGUAGES | GNU_LANG, // builtin requires GNU mode. | ||
| 204 | ALL_MS_LANGUAGES = ALL_LANGUAGES | MS_LANG, // builtin requires MS mode. | ||
| 205 | - ALL_OCLC_LANGUAGES = OCLC1X_LANG | OCLC20_LANG // builtin for OCLC languages. | ||
| 206 | + ALL_OCLC_LANGUAGES = OCLC1X_LANG | OCLC2P_LANG // builtin for OCLC languages. | ||
| 207 | }; | ||
| 208 | |||
| 209 | namespace Builtin { | ||
| 210 | @@ -228,6 +228,10 @@ public: | ||
| 211 | /// for non-builtins. | ||
| 212 | bool canBeRedeclared(unsigned ID) const; | ||
| 213 | |||
| 214 | + bool requiresFeatures(unsigned ID) const { | ||
| 215 | + return requiresFeatures(getRecord(ID)); | ||
| 216 | + } | ||
| 217 | + | ||
| 218 | private: | ||
| 219 | const Info &getRecord(unsigned ID) const; | ||
| 220 | |||
| 221 | @@ -235,6 +239,11 @@ private: | ||
| 222 | bool builtinIsSupported(const Builtin::Info &BuiltinInfo, | ||
| 223 | const LangOptions &LangOpts); | ||
| 224 | |||
| 225 | + bool OclBuiltinIsSupported(const Builtin::Info &BuiltinInfo, | ||
| 226 | + const LangOptions &LangOpts) const; | ||
| 227 | + | ||
| 228 | + bool requiresFeatures(const Builtin::Info &BuiltinInfo) const; | ||
| 229 | + | ||
| 230 | /// Helper function for isPrintfLike and isScanfLike. | ||
| 231 | bool isLike(unsigned ID, unsigned &FormatIdx, bool &HasVAListArg, | ||
| 232 | const char *Fmt) const; | ||
| 233 | diff --git a/clang/include/clang/Basic/DiagnosticParseKinds.td b/clang/include/clang/Basic/DiagnosticParseKinds.td | ||
| 234 | index 33adf093693f..43ea63586f91 100644 | ||
| 235 | --- a/clang/include/clang/Basic/DiagnosticParseKinds.td | ||
| 236 | +++ b/clang/include/clang/Basic/DiagnosticParseKinds.td | ||
| 237 | @@ -1199,6 +1199,8 @@ def warn_pragma_unsupported_extension : Warning< | ||
| 238 | "unsupported OpenCL extension %0 - ignoring">, InGroup<IgnoredPragmas>; | ||
| 239 | def warn_pragma_extension_is_core : Warning< | ||
| 240 | "OpenCL extension %0 is core feature or supported optional core feature - ignoring">, InGroup<DiagGroup<"pedantic-core-features">>, DefaultIgnore; | ||
| 241 | +def warn_opencl_pragma_feature_ignore : Warning< | ||
| 242 | + "OpenCL feature support can't be controlled via pragma, ignoring">, InGroup<IgnoredPragmas>; | ||
| 243 | |||
| 244 | // OpenCL errors. | ||
| 245 | def err_opencl_taking_function_address_parser : Error< | ||
| 246 | diff --git a/clang/include/clang/Basic/DiagnosticSemaKinds.td b/clang/include/clang/Basic/DiagnosticSemaKinds.td | ||
| 247 | index 917377420505..91648aa27820 100644 | ||
| 248 | --- a/clang/include/clang/Basic/DiagnosticSemaKinds.td | ||
| 249 | +++ b/clang/include/clang/Basic/DiagnosticSemaKinds.td | ||
| 250 | @@ -9378,6 +9378,13 @@ def ext_opencl_ext_vector_type_rgba_selector: ExtWarn< | ||
| 251 | def err_openclcxx_placement_new : Error< | ||
| 252 | "use of placement new requires explicit declaration">; | ||
| 253 | |||
| 254 | +def err_opencl_pipes_require_feat : Error< | ||
| 255 | + "usage of OpenCL pipes requires feature support">; | ||
| 256 | +def err_opencl_memory_scope_require_feat : Error< | ||
| 257 | + "usage of memory scope requires feature support">; | ||
| 258 | +def err_opencl_memory_ordering_require_feat : Error< | ||
| 259 | + "usage of memory ordering requires feature support">; | ||
| 260 | + | ||
| 261 | // MIG routine annotations. | ||
| 262 | def warn_mig_server_routine_does_not_return_kern_return_t : Warning< | ||
| 263 | "'mig_server_routine' attribute only applies to routines that return a kern_return_t">, | ||
| 264 | diff --git a/clang/include/clang/Basic/LangOptions.def b/clang/include/clang/Basic/LangOptions.def | ||
| 265 | index 3319a3123976..406f45c0be69 100644 | ||
| 266 | --- a/clang/include/clang/Basic/LangOptions.def | ||
| 267 | +++ b/clang/include/clang/Basic/LangOptions.def | ||
| 268 | @@ -203,6 +203,8 @@ LANGOPT(OpenCL , 1, 0, "OpenCL") | ||
| 269 | LANGOPT(OpenCLVersion , 32, 0, "OpenCL C version") | ||
| 270 | LANGOPT(OpenCLCPlusPlus , 1, 0, "C++ for OpenCL") | ||
| 271 | LANGOPT(OpenCLCPlusPlusVersion , 32, 0, "C++ for OpenCL version") | ||
| 272 | +LANGOPT(OpenCLGenericKeyword , 1, 0, "OpenCL generic keyword") | ||
| 273 | +LANGOPT(OpenCLPipeKeyword , 1, 0, "OpenCL pipe keyword") | ||
| 274 | LANGOPT(NativeHalfType , 1, 0, "Native half type support") | ||
| 275 | LANGOPT(NativeHalfArgsAndReturns, 1, 0, "Native half args and returns") | ||
| 276 | LANGOPT(HalfArgsAndReturns, 1, 0, "half args and returns") | ||
| 277 | diff --git a/clang/include/clang/Basic/LangStandards.def b/clang/include/clang/Basic/LangStandards.def | ||
| 278 | index 7f1a24db7e9b..69aaba3ff5a2 100644 | ||
| 279 | --- a/clang/include/clang/Basic/LangStandards.def | ||
| 280 | +++ b/clang/include/clang/Basic/LangStandards.def | ||
| 281 | @@ -167,6 +167,9 @@ LANGSTANDARD(opencl12, "cl1.2", | ||
| 282 | LANGSTANDARD(opencl20, "cl2.0", | ||
| 283 | OpenCL, "OpenCL 2.0", | ||
| 284 | LineComment | C99 | Digraphs | HexFloat | OpenCL) | ||
| 285 | +LANGSTANDARD(opencl30, "cl3.0", | ||
| 286 | + OpenCL, "OpenCL 3.0", | ||
| 287 | + LineComment | C99 | Digraphs | HexFloat | OpenCL) | ||
| 288 | LANGSTANDARD(openclcpp, "clc++", | ||
| 289 | OpenCL, "C++ for OpenCL", | ||
| 290 | LineComment | CPlusPlus | CPlusPlus11 | CPlusPlus14 | CPlusPlus17 | | ||
| 291 | @@ -176,6 +179,7 @@ LANGSTANDARD_ALIAS_DEPR(opencl10, "CL") | ||
| 292 | LANGSTANDARD_ALIAS_DEPR(opencl11, "CL1.1") | ||
| 293 | LANGSTANDARD_ALIAS_DEPR(opencl12, "CL1.2") | ||
| 294 | LANGSTANDARD_ALIAS_DEPR(opencl20, "CL2.0") | ||
| 295 | +LANGSTANDARD_ALIAS_DEPR(opencl30, "CL3.0") | ||
| 296 | LANGSTANDARD_ALIAS_DEPR(openclcpp, "CLC++") | ||
| 297 | |||
| 298 | // CUDA | ||
| 299 | diff --git a/clang/include/clang/Basic/OpenCLExtensions.def b/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 300 | index 517481584313..608f78a13eef 100644 | ||
| 301 | --- a/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 302 | +++ b/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 303 | @@ -93,6 +93,21 @@ OPENCLEXT_INTERNAL(cl_intel_subgroups, 120, ~0U) | ||
| 304 | OPENCLEXT_INTERNAL(cl_intel_subgroups_short, 120, ~0U) | ||
| 305 | OPENCLEXT_INTERNAL(cl_intel_device_side_avc_motion_estimation, 120, ~0U) | ||
| 306 | |||
| 307 | +OPENCLEXT_INTERNAL(__opencl_c_pipes, 200, ~0U) | ||
| 308 | +OPENCLEXT_INTERNAL(__opencl_c_generic_address_space, 200, ~0U) | ||
| 309 | +OPENCLEXT_INTERNAL(__opencl_c_work_group_collective_functions, 200, ~0U) | ||
| 310 | +OPENCLEXT_INTERNAL(__opencl_c_atomic_order_acq_rel, 200, ~0U) | ||
| 311 | +OPENCLEXT_INTERNAL(__opencl_c_atomic_order_seq_cst, 200, ~0U) | ||
| 312 | +OPENCLEXT_INTERNAL(__opencl_c_atomic_scope_device, 200, ~0U) | ||
| 313 | +OPENCLEXT_INTERNAL(__opencl_c_atomic_scope_all_devices, 200, ~0U) | ||
| 314 | +OPENCLEXT_INTERNAL(__opencl_c_subgroups, 200, ~0U) | ||
| 315 | +OPENCLEXT_INTERNAL(__opencl_c_3d_image_writes, 100, ~0U) | ||
| 316 | +OPENCLEXT_INTERNAL(__opencl_c_device_enqueue, 200, ~0U) | ||
| 317 | +OPENCLEXT_INTERNAL(__opencl_c_read_write_images, 200, ~0U) | ||
| 318 | +OPENCLEXT_INTERNAL(__opencl_c_program_scope_global_variables, 200, ~0U) | ||
| 319 | +OPENCLEXT_INTERNAL(__opencl_c_fp64, 120, ~0U) | ||
| 320 | +OPENCLEXT_INTERNAL(__opencl_c_int64, 100, ~0U) | ||
| 321 | +OPENCLEXT_INTERNAL(__opencl_c_images, 100, ~0U) | ||
| 322 | #undef OPENCLEXT_INTERNAL | ||
| 323 | |||
| 324 | #ifdef OPENCLEXT | ||
| 325 | diff --git a/clang/include/clang/Basic/OpenCLOptions.h b/clang/include/clang/Basic/OpenCLOptions.h | ||
| 326 | index 15661154eab5..9a3a8e33cadd 100644 | ||
| 327 | --- a/clang/include/clang/Basic/OpenCLOptions.h | ||
| 328 | +++ b/clang/include/clang/Basic/OpenCLOptions.h | ||
| 329 | @@ -16,11 +16,16 @@ | ||
| 330 | |||
| 331 | #include "clang/Basic/LangOptions.h" | ||
| 332 | #include "llvm/ADT/StringMap.h" | ||
| 333 | +#include "llvm/ADT/StringSwitch.h" | ||
| 334 | |||
| 335 | namespace clang { | ||
| 336 | |||
| 337 | /// OpenCL supported extensions and optional core features | ||
| 338 | class OpenCLOptions { | ||
| 339 | + // OpenCL Version | ||
| 340 | + unsigned CLVer = 120; | ||
| 341 | + bool IsOpenCLCPlusPlus = false; | ||
| 342 | + | ||
| 343 | struct Info { | ||
| 344 | bool Supported; // Is this option supported | ||
| 345 | bool Enabled; // Is this option enabled | ||
| 346 | @@ -31,7 +36,38 @@ class OpenCLOptions { | ||
| 347 | :Supported(S), Enabled(E), Avail(A), Core(C){} | ||
| 348 | }; | ||
| 349 | llvm::StringMap<Info> OptMap; | ||
| 350 | + | ||
| 351 | public: | ||
| 352 | + void setOpenCLVersion(const LangOptions &LO) { | ||
| 353 | + IsOpenCLCPlusPlus = LO.OpenCLCPlusPlus; | ||
| 354 | + CLVer = IsOpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 355 | + } | ||
| 356 | + | ||
| 357 | + // Get extension which is semantically equivalent to a given feature | ||
| 358 | + // if exists (e.g. __opencl_c_subgroups -> cl_khr_subgroups) | ||
| 359 | + llvm::Optional<StringRef> getEquivalentExtension(StringRef Feature) const { | ||
| 360 | + return llvm::StringSwitch<llvm::Optional<StringRef>>(Feature) | ||
| 361 | + .Case("__opencl_c_3d_image_writes", | ||
| 362 | + Optional<StringRef>("cl_khr_3d_image_writes")) | ||
| 363 | + .Case("__opencl_c_subgroups", Optional<StringRef>("cl_khr_subgroups")) | ||
| 364 | + .Case("__opencl_c_fp64", Optional<StringRef>("cl_khr_fp64")) | ||
| 365 | + .Default(Optional<StringRef>()); | ||
| 366 | + } | ||
| 367 | + | ||
| 368 | + // Same as above but for extensions | ||
| 369 | + llvm::Optional<StringRef> getEquivalentFeature(StringRef Extension) const { | ||
| 370 | + return llvm::StringSwitch<llvm::Optional<StringRef>>(Extension) | ||
| 371 | + .Case("cl_khr_3d_image_writes", | ||
| 372 | + Optional<StringRef>("__opencl_c_3d_image_writes")) | ||
| 373 | + .Case("cl_khr_subgroups", Optional<StringRef>("__opencl_c_subgroups")) | ||
| 374 | + .Case("cl_khr_fp64", Optional<StringRef>("__opencl_c_fp64")) | ||
| 375 | + .Default(Optional<StringRef>()); | ||
| 376 | + } | ||
| 377 | + | ||
| 378 | + bool isFeature(llvm::StringRef Ext) const { | ||
| 379 | + return Ext.startswith("__opencl_c"); | ||
| 380 | + } | ||
| 381 | + | ||
| 382 | bool isKnown(llvm::StringRef Ext) const { | ||
| 383 | return OptMap.find(Ext) != OptMap.end(); | ||
| 384 | } | ||
| 385 | @@ -42,32 +78,88 @@ public: | ||
| 386 | |||
| 387 | // Is supported as either an extension or an (optional) core feature for | ||
| 388 | // OpenCL version \p CLVer. | ||
| 389 | - bool isSupported(llvm::StringRef Ext, const LangOptions &LO) const { | ||
| 390 | + bool isSupported(llvm::StringRef Ext) const { | ||
| 391 | // In C++ mode all extensions should work at least as in v2.0. | ||
| 392 | - auto CLVer = LO.OpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 393 | auto I = OptMap.find(Ext)->getValue(); | ||
| 394 | return I.Supported && I.Avail <= CLVer; | ||
| 395 | } | ||
| 396 | |||
| 397 | // Is supported (optional) OpenCL core features for OpenCL version \p CLVer. | ||
| 398 | // For supported extension, return false. | ||
| 399 | - bool isSupportedCore(llvm::StringRef Ext, const LangOptions &LO) const { | ||
| 400 | + bool isSupportedCore(llvm::StringRef Ext) const { | ||
| 401 | // In C++ mode all extensions should work at least as in v2.0. | ||
| 402 | - auto CLVer = LO.OpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 403 | auto I = OptMap.find(Ext)->getValue(); | ||
| 404 | return I.Supported && I.Avail <= CLVer && I.Core != ~0U && CLVer >= I.Core; | ||
| 405 | } | ||
| 406 | |||
| 407 | // Is supported OpenCL extension for OpenCL version \p CLVer. | ||
| 408 | // For supported (optional) core feature, return false. | ||
| 409 | - bool isSupportedExtension(llvm::StringRef Ext, const LangOptions &LO) const { | ||
| 410 | + bool isSupportedExtension(llvm::StringRef Ext) const { | ||
| 411 | // In C++ mode all extensions should work at least as in v2.0. | ||
| 412 | - auto CLVer = LO.OpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 413 | auto I = OptMap.find(Ext)->getValue(); | ||
| 414 | return I.Supported && I.Avail <= CLVer && (I.Core == ~0U || CLVer < I.Core); | ||
| 415 | } | ||
| 416 | |||
| 417 | + // Support features whose support is directly related to the | ||
| 418 | + // specific OpenCL version. For example, OpenCL 2.0 supports | ||
| 419 | + // all features that are optional in 3.0 | ||
| 420 | + void adjustFeatures() { | ||
| 421 | + // Support int64 by default (assume compiling for FULL profile) | ||
| 422 | + OptMap["__opencl_c_int64"].Supported = true; | ||
| 423 | + | ||
| 424 | + if (CLVer >= 300) { | ||
| 425 | + // Simultaneously support extension and corresponding feature | ||
| 426 | + for (llvm::StringRef F : | ||
| 427 | + {"__opencl_c_subgroups", "__opencl_c_3d_image_writes", | ||
| 428 | + "__opencl_c_fp64"}) { | ||
| 429 | + auto Ext = getEquivalentExtension(F); | ||
| 430 | + OptMap[*Ext].Supported = OptMap[F].Supported; | ||
| 431 | + } | ||
| 432 | + | ||
| 433 | + // OpenCL C compilers that define the feature macro __opencl_c_pipes or | ||
| 434 | + // or __opencl_c_device_enqueue must also define the | ||
| 435 | + // feature macro __opencl_c_generic_address_space. | ||
| 436 | + if (OptMap["__opencl_c_pipes"].Supported || | ||
| 437 | + OptMap["__opencl_c_device_enqueue"].Supported) | ||
| 438 | + OptMap["__opencl_c_generic_address_space"].Supported = true; | ||
| 439 | + | ||
| 440 | + // OpenCL C compilers that define the feature macro | ||
| 441 | + // __opencl_c_3d_image_writes or __opencl_c_read_write_images must also | ||
| 442 | + // define the feature macro __opencl_c_images | ||
| 443 | + if (OptMap["__opencl_c_3d_image_writes"].Supported || | ||
| 444 | + OptMap["__opencl_c_read_write_images"].Supported) | ||
| 445 | + OptMap["__opencl_c_images"].Supported = true; | ||
| 446 | + | ||
| 447 | + // All other features are already supported with options | ||
| 448 | + // or in target settings | ||
| 449 | + return; | ||
| 450 | + } | ||
| 451 | + | ||
| 452 | + auto FeaturesRange = llvm::make_filter_range( | ||
| 453 | + OptMap, [&](llvm::StringMapEntry<Info> &OptVal) { | ||
| 454 | + auto Opt = OptVal.getKey(); | ||
| 455 | + return isFeature(Opt); | ||
| 456 | + }); | ||
| 457 | + | ||
| 458 | + for (auto &It : FeaturesRange) { | ||
| 459 | + auto &Info = It.getValue(); | ||
| 460 | + // For OpenCL version less then 3.0 some | ||
| 461 | + // features should be supported simulateneously | ||
| 462 | + // with specific extension | ||
| 463 | + if (Optional<llvm::StringRef> Ext = getEquivalentExtension(It.getKey())) | ||
| 464 | + Info.Supported = Info.Enabled = OptMap[*Ext].Supported; | ||
| 465 | + else if (Info.Avail <= CLVer) | ||
| 466 | + Info.Supported = Info.Enabled = true; | ||
| 467 | + } | ||
| 468 | + } | ||
| 469 | + | ||
| 470 | void enable(llvm::StringRef Ext, bool V = true) { | ||
| 471 | + // Ignore disabling extensions if corresponding features | ||
| 472 | + // already supported for OpenCL version higher then 3.0 | ||
| 473 | + if (CLVer >= 300) | ||
| 474 | + if (Optional<llvm::StringRef> F = getEquivalentFeature(Ext)) | ||
| 475 | + if (V != OptMap[*F].Enabled) | ||
| 476 | + return; | ||
| 477 | OptMap[Ext].Enabled = V; | ||
| 478 | } | ||
| 479 | |||
| 480 | @@ -96,7 +188,7 @@ public: | ||
| 481 | OptMap[Ext].Supported = V; | ||
| 482 | } | ||
| 483 | |||
| 484 | - OpenCLOptions(){ | ||
| 485 | + OpenCLOptions() { | ||
| 486 | #define OPENCLEXT_INTERNAL(Ext, AvailVer, CoreVer) \ | ||
| 487 | OptMap[#Ext].Avail = AvailVer; \ | ||
| 488 | OptMap[#Ext].Core = CoreVer; | ||
| 489 | @@ -104,35 +196,86 @@ public: | ||
| 490 | } | ||
| 491 | |||
| 492 | void addSupport(const OpenCLOptions &Opts) { | ||
| 493 | + assert(IsOpenCLCPlusPlus == Opts.IsOpenCLCPlusPlus && CLVer == Opts.CLVer); | ||
| 494 | for (auto &I:Opts.OptMap) | ||
| 495 | - if (I.second.Supported) | ||
| 496 | + if (I.second.Supported) { | ||
| 497 | OptMap[I.getKey()].Supported = true; | ||
| 498 | + // All features are enabled as they are supported | ||
| 499 | + if (isFeature(I.getKey())) | ||
| 500 | + OptMap[I.getKey()].Enabled = true; | ||
| 501 | + } | ||
| 502 | + if (CLVer >= 300) { | ||
| 503 | + // Enabling extensions with respect to features | ||
| 504 | + for (llvm::StringRef Ext : | ||
| 505 | + {"cl_khr_3d_image_writes", "cl_khr_subgroups", "cl_khr_fp64"}) { | ||
| 506 | + auto Feature = getEquivalentFeature(Ext); | ||
| 507 | + enable(Ext, OptMap[*Feature].Enabled); | ||
| 508 | + } | ||
| 509 | + } | ||
| 510 | } | ||
| 511 | |||
| 512 | void copy(const OpenCLOptions &Opts) { | ||
| 513 | + CLVer = Opts.CLVer; | ||
| 514 | + IsOpenCLCPlusPlus = Opts.IsOpenCLCPlusPlus; | ||
| 515 | OptMap = Opts.OptMap; | ||
| 516 | } | ||
| 517 | |||
| 518 | // Turn on or off support of all options. | ||
| 519 | void supportAll(bool On = true) { | ||
| 520 | - for (llvm::StringMap<Info>::iterator I = OptMap.begin(), | ||
| 521 | - E = OptMap.end(); I != E; ++I) | ||
| 522 | - I->second.Supported = On; | ||
| 523 | + for (llvm::StringMap<Info>::iterator I = OptMap.begin(), E = OptMap.end(); | ||
| 524 | + I != E; ++I) | ||
| 525 | + if (!isFeature(I->getKey())) | ||
| 526 | + I->second.Supported = On; | ||
| 527 | } | ||
| 528 | |||
| 529 | void disableAll() { | ||
| 530 | - for (llvm::StringMap<Info>::iterator I = OptMap.begin(), | ||
| 531 | - E = OptMap.end(); I != E; ++I) | ||
| 532 | - I->second.Enabled = false; | ||
| 533 | + for (llvm::StringMap<Info>::iterator I = OptMap.begin(), E = OptMap.end(); | ||
| 534 | + I != E; ++I) { | ||
| 535 | + auto Ext = I->getKey(); | ||
| 536 | + if (!isFeature(Ext)) | ||
| 537 | + enable(Ext, false); | ||
| 538 | + } | ||
| 539 | } | ||
| 540 | |||
| 541 | - void enableSupportedCore(LangOptions LO) { | ||
| 542 | + void enableSupportedCore() { | ||
| 543 | for (llvm::StringMap<Info>::iterator I = OptMap.begin(), E = OptMap.end(); | ||
| 544 | I != E; ++I) | ||
| 545 | - if (isSupportedCore(I->getKey(), LO)) | ||
| 546 | + if (isSupportedCore(I->getKey())) | ||
| 547 | I->second.Enabled = true; | ||
| 548 | } | ||
| 549 | |||
| 550 | + // This enum specifies how OpenCL versions map into values | ||
| 551 | + // for encoding. This is used when generating built-ins | ||
| 552 | + // from tablegen | ||
| 553 | + enum OpenCLVersionsEncodings : unsigned short { | ||
| 554 | + OPENCL_C_100_CODE = 0x1, | ||
| 555 | + OPENCL_C_110_CODE = 0x2, | ||
| 556 | + OPENCL_C_120_CODE = 0x4, | ||
| 557 | + OPENCL_C_200_CODE = 0x8, | ||
| 558 | + OPENCL_C_300_CODE = 0x10, | ||
| 559 | + OPENCL_C_ALL_CODE = 0x1f | ||
| 560 | + }; | ||
| 561 | + | ||
| 562 | + // Encode version into single integer | ||
| 563 | + static unsigned short EncodeVersion(unsigned OpenCLVersion) { | ||
| 564 | + switch (OpenCLVersion) { | ||
| 565 | + default: | ||
| 566 | + llvm_unreachable("Unknown OpenCL version"); | ||
| 567 | + case 0: | ||
| 568 | + return OpenCLVersionsEncodings::OPENCL_C_ALL_CODE; | ||
| 569 | + case 100: | ||
| 570 | + return OpenCLVersionsEncodings::OPENCL_C_100_CODE; | ||
| 571 | + case 110: | ||
| 572 | + return OpenCLVersionsEncodings::OPENCL_C_110_CODE; | ||
| 573 | + case 120: | ||
| 574 | + return OpenCLVersionsEncodings::OPENCL_C_120_CODE; | ||
| 575 | + case 200: | ||
| 576 | + return OpenCLVersionsEncodings::OPENCL_C_200_CODE; | ||
| 577 | + case 300: | ||
| 578 | + return OpenCLVersionsEncodings::OPENCL_C_300_CODE; | ||
| 579 | + } | ||
| 580 | + } | ||
| 581 | + | ||
| 582 | friend class ASTWriter; | ||
| 583 | friend class ASTReader; | ||
| 584 | }; | ||
| 585 | diff --git a/clang/include/clang/Driver/Options.td b/clang/include/clang/Driver/Options.td | ||
| 586 | index 391c895a453b..e03c22c749ad 100644 | ||
| 587 | --- a/clang/include/clang/Driver/Options.td | ||
| 588 | +++ b/clang/include/clang/Driver/Options.td | ||
| 589 | @@ -522,7 +522,7 @@ def cl_mad_enable : Flag<["-"], "cl-mad-enable">, Group<opencl_Group>, Flags<[CC | ||
| 590 | def cl_no_signed_zeros : Flag<["-"], "cl-no-signed-zeros">, Group<opencl_Group>, Flags<[CC1Option]>, | ||
| 591 | HelpText<"OpenCL only. Allow use of less precise no signed zeros computations in the generated binary.">; | ||
| 592 | def cl_std_EQ : Joined<["-"], "cl-std=">, Group<opencl_Group>, Flags<[CC1Option]>, | ||
| 593 | - HelpText<"OpenCL language standard to compile for.">, Values<"cl,CL,cl1.1,CL1.1,cl1.2,CL1.2,cl2.0,CL2.0,clc++,CLC++">; | ||
| 594 | + HelpText<"OpenCL language standard to compile for.">, Values<"cl,CL,cl1.1,CL1.1,cl1.2,CL1.2,cl2.0,CL2.0,cl3.0,CL3.0,clc++,CLC++">; | ||
| 595 | def cl_denorms_are_zero : Flag<["-"], "cl-denorms-are-zero">, Group<opencl_Group>, Flags<[CC1Option]>, | ||
| 596 | HelpText<"OpenCL only. Allow denormals to be flushed to zero.">; | ||
| 597 | def cl_fp32_correctly_rounded_divide_sqrt : Flag<["-"], "cl-fp32-correctly-rounded-divide-sqrt">, Group<opencl_Group>, Flags<[CC1Option]>, | ||
| 598 | diff --git a/clang/include/clang/Sema/Sema.h b/clang/include/clang/Sema/Sema.h | ||
| 599 | index 842e49602274..d8ac91bc8a31 100644 | ||
| 600 | --- a/clang/include/clang/Sema/Sema.h | ||
| 601 | +++ b/clang/include/clang/Sema/Sema.h | ||
| 602 | @@ -9632,6 +9632,10 @@ public: | ||
| 603 | /// \return true if type is disabled. | ||
| 604 | bool checkOpenCLDisabledDecl(const NamedDecl &D, const Expr &E); | ||
| 605 | |||
| 606 | + bool checkOpenCLSubgroupExtForCallExpr(CallExpr *Call); | ||
| 607 | + | ||
| 608 | + bool isSupportedOpenCLOMemoryOrdering(int64_t Ordering) const; | ||
| 609 | + | ||
| 610 | //===--------------------------------------------------------------------===// | ||
| 611 | // OpenMP directives and clauses. | ||
| 612 | // | ||
| 613 | @@ -11102,6 +11106,11 @@ public: | ||
| 614 | /// that the user intended an assignment used as condition. | ||
| 615 | void DiagnoseEqualityWithExtraParens(ParenExpr *ParenE); | ||
| 616 | |||
| 617 | + template <typename DiagLocT, typename DiagInfoT> | ||
| 618 | + void DiagnoseOpenCLRequiresOption(llvm::StringRef OpenCLOptName, | ||
| 619 | + DiagLocT DiagLoc, DiagInfoT DiagInfo, | ||
| 620 | + unsigned Selector, SourceRange SrcRange); | ||
| 621 | + | ||
| 622 | /// CheckCXXBooleanCondition - Returns true if conversion to bool is invalid. | ||
| 623 | ExprResult CheckCXXBooleanCondition(Expr *CondExpr, bool IsConstexpr = false); | ||
| 624 | |||
| 625 | diff --git a/clang/lib/AST/ASTContext.cpp b/clang/lib/AST/ASTContext.cpp | ||
| 626 | index 1be72efe4de8..2a81fbcde79d 100644 | ||
| 627 | --- a/clang/lib/AST/ASTContext.cpp | ||
| 628 | +++ b/clang/lib/AST/ASTContext.cpp | ||
| 629 | @@ -1490,7 +1490,8 @@ void ASTContext::InitBuiltinTypes(const TargetInfo &Target, | ||
| 630 | ObjCSuperType = QualType(); | ||
| 631 | |||
| 632 | // void * type | ||
| 633 | - if (LangOpts.OpenCLVersion >= 200) { | ||
| 634 | + if (Target.getSupportedOpenCLOpts().isEnabled( | ||
| 635 | + "__opencl_c_generic_address_space")) { | ||
| 636 | auto Q = VoidTy.getQualifiers(); | ||
| 637 | Q.setAddressSpace(LangAS::opencl_generic); | ||
| 638 | VoidPtrTy = getPointerType(getCanonicalType( | ||
| 639 | diff --git a/clang/lib/Basic/Builtins.cpp b/clang/lib/Basic/Builtins.cpp | ||
| 640 | index 0cd89df41b67..7a3067345098 100644 | ||
| 641 | --- a/clang/lib/Basic/Builtins.cpp | ||
| 642 | +++ b/clang/lib/Basic/Builtins.cpp | ||
| 643 | @@ -23,6 +23,8 @@ static const Builtin::Info BuiltinInfo[] = { | ||
| 644 | { #ID, TYPE, ATTRS, nullptr, ALL_LANGUAGES, nullptr }, | ||
| 645 | #define LANGBUILTIN(ID, TYPE, ATTRS, LANGS) \ | ||
| 646 | { #ID, TYPE, ATTRS, nullptr, LANGS, nullptr }, | ||
| 647 | +#define OPENCLBUILTIN(ID, TYPE, ATTRS, LANGS, FEATURE) \ | ||
| 648 | + {#ID, TYPE, ATTRS, nullptr, LANGS, FEATURE}, | ||
| 649 | #define LIBBUILTIN(ID, TYPE, ATTRS, HEADER, LANGS) \ | ||
| 650 | { #ID, TYPE, ATTRS, HEADER, LANGS, nullptr }, | ||
| 651 | #include "clang/Basic/Builtins.def" | ||
| 652 | @@ -69,16 +71,17 @@ bool Builtin::Context::builtinIsSupported(const Builtin::Info &BuiltinInfo, | ||
| 653 | bool ObjCUnsupported = !LangOpts.ObjC && BuiltinInfo.Langs == OBJC_LANG; | ||
| 654 | bool OclC1Unsupported = (LangOpts.OpenCLVersion / 100) != 1 && | ||
| 655 | (BuiltinInfo.Langs & ALL_OCLC_LANGUAGES ) == OCLC1X_LANG; | ||
| 656 | - bool OclC2Unsupported = | ||
| 657 | - (LangOpts.OpenCLVersion != 200 && !LangOpts.OpenCLCPlusPlus) && | ||
| 658 | - (BuiltinInfo.Langs & ALL_OCLC_LANGUAGES) == OCLC20_LANG; | ||
| 659 | + bool OclC2PUnsupported = | ||
| 660 | + (BuiltinInfo.Langs & ALL_OCLC_LANGUAGES) == OCLC2P_LANG && | ||
| 661 | + ((LangOpts.OpenCLVersion < 200 && !LangOpts.OpenCLCPlusPlus) || | ||
| 662 | + !OclBuiltinIsSupported(BuiltinInfo, LangOpts)); | ||
| 663 | bool OclCUnsupported = !LangOpts.OpenCL && | ||
| 664 | (BuiltinInfo.Langs & ALL_OCLC_LANGUAGES); | ||
| 665 | bool OpenMPUnsupported = !LangOpts.OpenMP && BuiltinInfo.Langs == OMP_LANG; | ||
| 666 | bool CPlusPlusUnsupported = | ||
| 667 | !LangOpts.CPlusPlus && BuiltinInfo.Langs == CXX_LANG; | ||
| 668 | return !BuiltinsUnsupported && !MathBuiltinsUnsupported && !OclCUnsupported && | ||
| 669 | - !OclC1Unsupported && !OclC2Unsupported && !OpenMPUnsupported && | ||
| 670 | + !OclC1Unsupported && !OclC2PUnsupported && !OpenMPUnsupported && | ||
| 671 | !GnuModeUnsupported && !MSModeUnsupported && !ObjCUnsupported && | ||
| 672 | !CPlusPlusUnsupported; | ||
| 673 | } | ||
| 674 | @@ -191,3 +194,20 @@ bool Builtin::Context::canBeRedeclared(unsigned ID) const { | ||
| 675 | (!hasReferenceArgsOrResult(ID) && | ||
| 676 | !hasCustomTypechecking(ID)); | ||
| 677 | } | ||
| 678 | + | ||
| 679 | +bool Builtin::Context::OclBuiltinIsSupported( | ||
| 680 | + const Builtin::Info &BuiltinInfo, const LangOptions &LangOpts) const { | ||
| 681 | + if (!requiresFeatures(BuiltinInfo)) | ||
| 682 | + return true; | ||
| 683 | + | ||
| 684 | + return llvm::StringSwitch<bool>(BuiltinInfo.Features) | ||
| 685 | + .Case("__opencl_c_device_enqueue", LangOpts.Blocks) | ||
| 686 | + .Case("__opencl_c_generic_address_space", LangOpts.OpenCLGenericKeyword) | ||
| 687 | + .Case("__opencl_c_pipes", LangOpts.OpenCLPipeKeyword) | ||
| 688 | + .Default(false); | ||
| 689 | +} | ||
| 690 | + | ||
| 691 | +bool Builtin::Context::requiresFeatures( | ||
| 692 | + const Builtin::Info &BuiltinInfo) const { | ||
| 693 | + return BuiltinInfo.Features && llvm::StringRef(BuiltinInfo.Features) != ""; | ||
| 694 | +} | ||
| 695 | diff --git a/clang/lib/Basic/TargetInfo.cpp b/clang/lib/Basic/TargetInfo.cpp | ||
| 696 | index 3a21a19e1f19..795311d5934e 100644 | ||
| 697 | --- a/clang/lib/Basic/TargetInfo.cpp | ||
| 698 | +++ b/clang/lib/Basic/TargetInfo.cpp | ||
| 699 | @@ -377,6 +377,17 @@ void TargetInfo::adjust(LangOptions &Opts) { | ||
| 700 | HalfFormat = &llvm::APFloat::IEEEhalf(); | ||
| 701 | FloatFormat = &llvm::APFloat::IEEEsingle(); | ||
| 702 | LongDoubleFormat = &llvm::APFloat::IEEEquad(); | ||
| 703 | + | ||
| 704 | + auto &SupportedOCLOpts = getTargetOpts().SupportedOpenCLOptions; | ||
| 705 | + | ||
| 706 | + SupportedOCLOpts.setOpenCLVersion(Opts); | ||
| 707 | + SupportedOCLOpts.adjustFeatures(); | ||
| 708 | + | ||
| 709 | + if (!Opts.OpenCLCPlusPlus && Opts.OpenCLVersion >= 200) | ||
| 710 | + Opts.Blocks = SupportedOCLOpts.isSupported("__opencl_c_device_enqueue"); | ||
| 711 | + Opts.OpenCLGenericKeyword = | ||
| 712 | + SupportedOCLOpts.isSupported("__opencl_c_generic_address_space"); | ||
| 713 | + Opts.OpenCLPipeKeyword = SupportedOCLOpts.isSupported("__opencl_c_pipes"); | ||
| 714 | } | ||
| 715 | |||
| 716 | if (Opts.LongDoubleSize) { | ||
| 717 | diff --git a/clang/lib/Basic/Targets.cpp b/clang/lib/Basic/Targets.cpp | ||
| 718 | index c063f8ca4472..b394be18a234 100644 | ||
| 719 | --- a/clang/lib/Basic/Targets.cpp | ||
| 720 | +++ b/clang/lib/Basic/Targets.cpp | ||
| 721 | @@ -39,7 +39,6 @@ | ||
| 722 | #include "clang/Basic/Diagnostic.h" | ||
| 723 | #include "llvm/ADT/StringExtras.h" | ||
| 724 | #include "llvm/ADT/Triple.h" | ||
| 725 | - | ||
| 726 | using namespace clang; | ||
| 727 | |||
| 728 | namespace clang { | ||
| 729 | diff --git a/clang/lib/CodeGen/CodeGenFunction.cpp b/clang/lib/CodeGen/CodeGenFunction.cpp | ||
| 730 | index 648e6d9c214a..6d839fa61abc 100644 | ||
| 731 | --- a/clang/lib/CodeGen/CodeGenFunction.cpp | ||
| 732 | +++ b/clang/lib/CodeGen/CodeGenFunction.cpp | ||
| 733 | @@ -2303,11 +2303,11 @@ void CodeGenFunction::checkTargetFeatures(SourceLocation Loc, | ||
| 734 | std::string MissingFeature; | ||
| 735 | if (BuiltinID) { | ||
| 736 | SmallVector<StringRef, 1> ReqFeatures; | ||
| 737 | - const char *FeatureList = | ||
| 738 | - CGM.getContext().BuiltinInfo.getRequiredFeatures(BuiltinID); | ||
| 739 | // Return if the builtin doesn't have any required features. | ||
| 740 | - if (!FeatureList || StringRef(FeatureList) == "") | ||
| 741 | + if (!CGM.getContext().BuiltinInfo.requiresFeatures(BuiltinID)) | ||
| 742 | return; | ||
| 743 | + const char *FeatureList = | ||
| 744 | + CGM.getContext().BuiltinInfo.getRequiredFeatures(BuiltinID); | ||
| 745 | StringRef(FeatureList).split(ReqFeatures, ','); | ||
| 746 | if (!hasRequiredFeatures(ReqFeatures, CGM, FD, MissingFeature)) | ||
| 747 | CGM.getDiags().Report(Loc, diag::err_builtin_needs_feature) | ||
| 748 | diff --git a/clang/lib/Frontend/CompilerInvocation.cpp b/clang/lib/Frontend/CompilerInvocation.cpp | ||
| 749 | index e98a407ac42f..18fa06bf3c6d 100644 | ||
| 750 | --- a/clang/lib/Frontend/CompilerInvocation.cpp | ||
| 751 | +++ b/clang/lib/Frontend/CompilerInvocation.cpp | ||
| 752 | @@ -2298,6 +2298,8 @@ void CompilerInvocation::setLangDefaults(LangOptions &Opts, InputKind IK, | ||
| 753 | Opts.OpenCLVersion = 120; | ||
| 754 | else if (LangStd == LangStandard::lang_opencl20) | ||
| 755 | Opts.OpenCLVersion = 200; | ||
| 756 | + else if (LangStd == LangStandard::lang_opencl30) | ||
| 757 | + Opts.OpenCLVersion = 300; | ||
| 758 | else if (LangStd == LangStandard::lang_openclcpp) | ||
| 759 | Opts.OpenCLCPlusPlusVersion = 100; | ||
| 760 | |||
| 761 | @@ -2498,14 +2500,15 @@ static void ParseLangArgs(LangOptions &Opts, ArgList &Args, InputKind IK, | ||
| 762 | // -cl-std only applies for OpenCL language standards. | ||
| 763 | // Override the -std option in this case. | ||
| 764 | if (const Arg *A = Args.getLastArg(OPT_cl_std_EQ)) { | ||
| 765 | - LangStandard::Kind OpenCLLangStd | ||
| 766 | - = llvm::StringSwitch<LangStandard::Kind>(A->getValue()) | ||
| 767 | - .Cases("cl", "CL", LangStandard::lang_opencl10) | ||
| 768 | - .Cases("cl1.1", "CL1.1", LangStandard::lang_opencl11) | ||
| 769 | - .Cases("cl1.2", "CL1.2", LangStandard::lang_opencl12) | ||
| 770 | - .Cases("cl2.0", "CL2.0", LangStandard::lang_opencl20) | ||
| 771 | - .Cases("clc++", "CLC++", LangStandard::lang_openclcpp) | ||
| 772 | - .Default(LangStandard::lang_unspecified); | ||
| 773 | + LangStandard::Kind OpenCLLangStd = | ||
| 774 | + llvm::StringSwitch<LangStandard::Kind>(A->getValue()) | ||
| 775 | + .Cases("cl", "CL", LangStandard::lang_opencl10) | ||
| 776 | + .Cases("cl1.1", "CL1.1", LangStandard::lang_opencl11) | ||
| 777 | + .Cases("cl1.2", "CL1.2", LangStandard::lang_opencl12) | ||
| 778 | + .Cases("cl2.0", "CL2.0", LangStandard::lang_opencl20) | ||
| 779 | + .Cases("cl3.0", "CL3.0", LangStandard::lang_opencl30) | ||
| 780 | + .Cases("clc++", "CLC++", LangStandard::lang_openclcpp) | ||
| 781 | + .Default(LangStandard::lang_unspecified); | ||
| 782 | |||
| 783 | if (OpenCLLangStd == LangStandard::lang_unspecified) { | ||
| 784 | Diags.Report(diag::err_drv_invalid_value) | ||
| 785 | @@ -2787,8 +2790,7 @@ static void ParseLangArgs(LangOptions &Opts, ArgList &Args, InputKind IK, | ||
| 786 | |||
| 787 | Opts.RTTI = Opts.CPlusPlus && !Args.hasArg(OPT_fno_rtti); | ||
| 788 | Opts.RTTIData = Opts.RTTI && !Args.hasArg(OPT_fno_rtti_data); | ||
| 789 | - Opts.Blocks = Args.hasArg(OPT_fblocks) || (Opts.OpenCL | ||
| 790 | - && Opts.OpenCLVersion == 200); | ||
| 791 | + Opts.Blocks = Args.hasArg(OPT_fblocks); | ||
| 792 | Opts.BlocksRuntimeOptional = Args.hasArg(OPT_fblocks_runtime_optional); | ||
| 793 | Opts.Coroutines = Opts.CPlusPlus2a || Args.hasArg(OPT_fcoroutines_ts); | ||
| 794 | |||
| 795 | diff --git a/clang/lib/Frontend/InitPreprocessor.cpp b/clang/lib/Frontend/InitPreprocessor.cpp | ||
| 796 | index c273cb96d9b9..aefd208e6cd3 100644 | ||
| 797 | --- a/clang/lib/Frontend/InitPreprocessor.cpp | ||
| 798 | +++ b/clang/lib/Frontend/InitPreprocessor.cpp | ||
| 799 | @@ -445,6 +445,9 @@ static void InitializeStandardPredefinedMacros(const TargetInfo &TI, | ||
| 800 | case 200: | ||
| 801 | Builder.defineMacro("__OPENCL_C_VERSION__", "200"); | ||
| 802 | break; | ||
| 803 | + case 300: | ||
| 804 | + Builder.defineMacro("__OPENCL_C_VERSION__", "300"); | ||
| 805 | + break; | ||
| 806 | default: | ||
| 807 | llvm_unreachable("Unsupported OpenCL version"); | ||
| 808 | } | ||
| 809 | @@ -453,6 +456,7 @@ static void InitializeStandardPredefinedMacros(const TargetInfo &TI, | ||
| 810 | Builder.defineMacro("CL_VERSION_1_1", "110"); | ||
| 811 | Builder.defineMacro("CL_VERSION_1_2", "120"); | ||
| 812 | Builder.defineMacro("CL_VERSION_2_0", "200"); | ||
| 813 | + Builder.defineMacro("CL_VERSION_3_0", "300"); | ||
| 814 | |||
| 815 | if (TI.isLittleEndian()) | ||
| 816 | Builder.defineMacro("__ENDIAN_LITTLE__"); | ||
| 817 | @@ -1101,7 +1105,7 @@ static void InitializePredefinedMacros(const TargetInfo &TI, | ||
| 818 | // OpenCL definitions. | ||
| 819 | if (LangOpts.OpenCL) { | ||
| 820 | #define OPENCLEXT(Ext) \ | ||
| 821 | - if (TI.getSupportedOpenCLOpts().isSupported(#Ext, LangOpts)) \ | ||
| 822 | + if (TI.getSupportedOpenCLOpts().isSupported(#Ext)) \ | ||
| 823 | Builder.defineMacro(#Ext); | ||
| 824 | #include "clang/Basic/OpenCLExtensions.def" | ||
| 825 | |||
| 826 | diff --git a/clang/lib/Headers/opencl-c-base.h b/clang/lib/Headers/opencl-c-base.h | ||
| 827 | index 430e07d36f62..2cc688ccc3da 100644 | ||
| 828 | --- a/clang/lib/Headers/opencl-c-base.h | ||
| 829 | +++ b/clang/lib/Headers/opencl-c-base.h | ||
| 830 | @@ -9,6 +9,59 @@ | ||
| 831 | #ifndef _OPENCL_BASE_H_ | ||
| 832 | #define _OPENCL_BASE_H_ | ||
| 833 | |||
| 834 | +// Add predefined macros to build headers with standalone executable | ||
| 835 | +#ifndef CL_VERSION_3_0 | ||
| 836 | + #define CL_VERSION_3_0 300 | ||
| 837 | +#endif | ||
| 838 | + | ||
| 839 | +// Define features for 2.0 for header backward compatibility | ||
| 840 | +#ifndef __opencl_c_int64 | ||
| 841 | + #define __opencl_c_int64 1 | ||
| 842 | +#endif | ||
| 843 | +#if __OPENCL_C_VERSION__ != CL_VERSION_3_0 | ||
| 844 | + #ifndef __opencl_c_images | ||
| 845 | + #define __opencl_c_images 1 | ||
| 846 | + #endif | ||
| 847 | +#endif | ||
| 848 | +#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 849 | +#ifndef __opencl_c_pipes | ||
| 850 | + #define __opencl_c_pipes 1 | ||
| 851 | +#endif | ||
| 852 | +#ifndef __opencl_c_generic_address_space | ||
| 853 | + #define __opencl_c_generic_address_space 1 | ||
| 854 | +#endif | ||
| 855 | +#ifndef __opencl_c_work_group_collective_functions | ||
| 856 | + #define __opencl_c_work_group_collective_functions 1 | ||
| 857 | +#endif | ||
| 858 | +#ifndef __opencl_c_atomic_order_acq_rel | ||
| 859 | + #define __opencl_c_atomic_order_acq_rel 1 | ||
| 860 | +#endif | ||
| 861 | +#ifndef __opencl_c_atomic_order_seq_cst | ||
| 862 | + #define __opencl_c_atomic_order_seq_cst 1 | ||
| 863 | +#endif | ||
| 864 | +#ifndef __opencl_c_atomic_scope_device | ||
| 865 | + #define __opencl_c_atomic_scope_device 1 | ||
| 866 | +#endif | ||
| 867 | +#ifndef __opencl_c_atomic_scope_all_devices | ||
| 868 | + #define __opencl_c_atomic_scope_all_devices 1 | ||
| 869 | +#endif | ||
| 870 | +#ifndef __opencl_c_subgroups | ||
| 871 | + #define __opencl_c_subgroups 1 | ||
| 872 | +#endif | ||
| 873 | +#ifndef __opencl_c_3d_image_writes | ||
| 874 | + #define __opencl_c_3d_image_writes 1 | ||
| 875 | +#endif | ||
| 876 | +#ifndef __opencl_c_device_enqueue | ||
| 877 | + #define __opencl_c_device_enqueue 1 | ||
| 878 | +#endif | ||
| 879 | +#ifndef __opencl_c_read_write_images | ||
| 880 | + #define __opencl_c_read_write_images 1 | ||
| 881 | +#endif | ||
| 882 | +#ifndef __opencl_c_program_scope_global_variables | ||
| 883 | + #define __opencl_c_program_scope_global_variables 1 | ||
| 884 | +#endif | ||
| 885 | +#endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 886 | + | ||
| 887 | // built-in scalar data types: | ||
| 888 | |||
| 889 | /** | ||
| 890 | @@ -115,7 +168,12 @@ typedef half half4 __attribute__((ext_vector_type(4))); | ||
| 891 | typedef half half8 __attribute__((ext_vector_type(8))); | ||
| 892 | typedef half half16 __attribute__((ext_vector_type(16))); | ||
| 893 | #endif | ||
| 894 | -#ifdef cl_khr_fp64 | ||
| 895 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 896 | + | ||
| 897 | +#ifndef __opencl_c_fp64 | ||
| 898 | + #define __opencl_c_fp64 1 | ||
| 899 | +#endif | ||
| 900 | + | ||
| 901 | #if __OPENCL_C_VERSION__ < CL_VERSION_1_2 | ||
| 902 | #pragma OPENCL EXTENSION cl_khr_fp64 : enable | ||
| 903 | #endif | ||
| 904 | @@ -281,9 +339,17 @@ typedef uint cl_mem_fence_flags; | ||
| 905 | typedef enum memory_scope { | ||
| 906 | memory_scope_work_item = __OPENCL_MEMORY_SCOPE_WORK_ITEM, | ||
| 907 | memory_scope_work_group = __OPENCL_MEMORY_SCOPE_WORK_GROUP, | ||
| 908 | +#ifdef __opencl_c_atomic_scope_device | ||
| 909 | memory_scope_device = __OPENCL_MEMORY_SCOPE_DEVICE, | ||
| 910 | +#endif | ||
| 911 | +#ifdef __opencl_c_atomic_scope_all_devices | ||
| 912 | + #if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 913 | + memory_scope_all_devices = __OPENCL_MEMORY_SCOPE_ALL_SVM_DEVICES, | ||
| 914 | + #endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 915 | memory_scope_all_svm_devices = __OPENCL_MEMORY_SCOPE_ALL_SVM_DEVICES, | ||
| 916 | -#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups) | ||
| 917 | +#endif | ||
| 918 | +#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups) || \ | ||
| 919 | + defined(__opencl_c_subgroups) | ||
| 920 | memory_scope_sub_group = __OPENCL_MEMORY_SCOPE_SUB_GROUP | ||
| 921 | #endif | ||
| 922 | } memory_scope; | ||
| 923 | @@ -301,13 +367,14 @@ typedef enum memory_scope { | ||
| 924 | #define ATOMIC_FLAG_INIT 0 | ||
| 925 | |||
| 926 | // enum values aligned with what clang uses in EmitAtomicExpr() | ||
| 927 | -typedef enum memory_order | ||
| 928 | -{ | ||
| 929 | +typedef enum memory_order { | ||
| 930 | memory_order_relaxed = __ATOMIC_RELAXED, | ||
| 931 | memory_order_acquire = __ATOMIC_ACQUIRE, | ||
| 932 | memory_order_release = __ATOMIC_RELEASE, | ||
| 933 | memory_order_acq_rel = __ATOMIC_ACQ_REL, | ||
| 934 | +#ifdef __opencl_c_atomic_order_seq_cst | ||
| 935 | memory_order_seq_cst = __ATOMIC_SEQ_CST | ||
| 936 | +#endif //__opencl_c_atomic_order_seq_cst | ||
| 937 | } memory_order; | ||
| 938 | |||
| 939 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 940 | diff --git a/clang/lib/Headers/opencl-c.h b/clang/lib/Headers/opencl-c.h | ||
| 941 | index 3210f93cc851..93a946cec5b1 100644 | ||
| 942 | --- a/clang/lib/Headers/opencl-c.h | ||
| 943 | +++ b/clang/lib/Headers/opencl-c.h | ||
| 944 | @@ -35,7 +35,6 @@ | ||
| 945 | #define __purefn __attribute__((pure)) | ||
| 946 | #define __cnfn __attribute__((const)) | ||
| 947 | |||
| 948 | - | ||
| 949 | // OpenCL v1.1/1.2/2.0 s6.2.3 - Explicit conversions | ||
| 950 | |||
| 951 | char __ovld __cnfn convert_char_rte(char); | ||
| 952 | @@ -4632,7 +4631,7 @@ float16 __ovld __cnfn convert_float16(float16); | ||
| 953 | |||
| 954 | // Conversions with double data type parameters or return value. | ||
| 955 | |||
| 956 | -#ifdef cl_khr_fp64 | ||
| 957 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 958 | char __ovld __cnfn convert_char(double); | ||
| 959 | char __ovld __cnfn convert_char_rte(double); | ||
| 960 | char __ovld __cnfn convert_char_rtn(double); | ||
| 961 | @@ -5452,7 +5451,7 @@ double16 __ovld __cnfn convert_double16_rtz(uchar16); | ||
| 962 | double16 __ovld __cnfn convert_double16_rtz(uint16); | ||
| 963 | double16 __ovld __cnfn convert_double16_rtz(ulong16); | ||
| 964 | double16 __ovld __cnfn convert_double16_rtz(ushort16); | ||
| 965 | -#endif //cl_khr_fp64 | ||
| 966 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 967 | |||
| 968 | #ifdef cl_khr_fp16 | ||
| 969 | // Convert half types to non-double types. | ||
| 970 | @@ -6270,7 +6269,7 @@ half16 __ovld __cnfn convert_half16_rtz(float16); | ||
| 971 | half16 __ovld __cnfn convert_half16_rtz(half16); | ||
| 972 | |||
| 973 | // Convert half types to double types. | ||
| 974 | -#ifdef cl_khr_fp64 | ||
| 975 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 976 | double __ovld __cnfn convert_double(half); | ||
| 977 | double __ovld __cnfn convert_double_rte(half); | ||
| 978 | double __ovld __cnfn convert_double_rtp(half); | ||
| 979 | @@ -6333,7 +6332,7 @@ half16 __ovld __cnfn convert_half16_rte(double16); | ||
| 980 | half16 __ovld __cnfn convert_half16_rtp(double16); | ||
| 981 | half16 __ovld __cnfn convert_half16_rtn(double16); | ||
| 982 | half16 __ovld __cnfn convert_half16_rtz(double16); | ||
| 983 | -#endif //cl_khr_fp64 | ||
| 984 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 985 | |||
| 986 | #endif // cl_khr_fp16 | ||
| 987 | |||
| 988 | @@ -6404,14 +6403,14 @@ half16 __ovld __cnfn convert_half16_rtz(double16); | ||
| 989 | #define as_float8(x) __builtin_astype((x), float8) | ||
| 990 | #define as_float16(x) __builtin_astype((x), float16) | ||
| 991 | |||
| 992 | -#ifdef cl_khr_fp64 | ||
| 993 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 994 | #define as_double(x) __builtin_astype((x), double) | ||
| 995 | #define as_double2(x) __builtin_astype((x), double2) | ||
| 996 | #define as_double3(x) __builtin_astype((x), double3) | ||
| 997 | #define as_double4(x) __builtin_astype((x), double4) | ||
| 998 | #define as_double8(x) __builtin_astype((x), double8) | ||
| 999 | #define as_double16(x) __builtin_astype((x), double16) | ||
| 1000 | -#endif //cl_khr_fp64 | ||
| 1001 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1002 | |||
| 1003 | #ifdef cl_khr_fp16 | ||
| 1004 | #define as_half(x) __builtin_astype((x), half) | ||
| 1005 | @@ -6534,14 +6533,14 @@ float3 __ovld __cnfn acos(float3); | ||
| 1006 | float4 __ovld __cnfn acos(float4); | ||
| 1007 | float8 __ovld __cnfn acos(float8); | ||
| 1008 | float16 __ovld __cnfn acos(float16); | ||
| 1009 | -#ifdef cl_khr_fp64 | ||
| 1010 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1011 | double __ovld __cnfn acos(double); | ||
| 1012 | double2 __ovld __cnfn acos(double2); | ||
| 1013 | double3 __ovld __cnfn acos(double3); | ||
| 1014 | double4 __ovld __cnfn acos(double4); | ||
| 1015 | double8 __ovld __cnfn acos(double8); | ||
| 1016 | double16 __ovld __cnfn acos(double16); | ||
| 1017 | -#endif //cl_khr_fp64 | ||
| 1018 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1019 | #ifdef cl_khr_fp16 | ||
| 1020 | half __ovld __cnfn acos(half); | ||
| 1021 | half2 __ovld __cnfn acos(half2); | ||
| 1022 | @@ -6560,14 +6559,14 @@ float3 __ovld __cnfn acosh(float3); | ||
| 1023 | float4 __ovld __cnfn acosh(float4); | ||
| 1024 | float8 __ovld __cnfn acosh(float8); | ||
| 1025 | float16 __ovld __cnfn acosh(float16); | ||
| 1026 | -#ifdef cl_khr_fp64 | ||
| 1027 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1028 | double __ovld __cnfn acosh(double); | ||
| 1029 | double2 __ovld __cnfn acosh(double2); | ||
| 1030 | double3 __ovld __cnfn acosh(double3); | ||
| 1031 | double4 __ovld __cnfn acosh(double4); | ||
| 1032 | double8 __ovld __cnfn acosh(double8); | ||
| 1033 | double16 __ovld __cnfn acosh(double16); | ||
| 1034 | -#endif //cl_khr_fp64 | ||
| 1035 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1036 | #ifdef cl_khr_fp16 | ||
| 1037 | half __ovld __cnfn acosh(half); | ||
| 1038 | half2 __ovld __cnfn acosh(half2); | ||
| 1039 | @@ -6586,14 +6585,14 @@ float3 __ovld __cnfn acospi(float3 x); | ||
| 1040 | float4 __ovld __cnfn acospi(float4 x); | ||
| 1041 | float8 __ovld __cnfn acospi(float8 x); | ||
| 1042 | float16 __ovld __cnfn acospi(float16 x); | ||
| 1043 | -#ifdef cl_khr_fp64 | ||
| 1044 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1045 | double __ovld __cnfn acospi(double x); | ||
| 1046 | double2 __ovld __cnfn acospi(double2 x); | ||
| 1047 | double3 __ovld __cnfn acospi(double3 x); | ||
| 1048 | double4 __ovld __cnfn acospi(double4 x); | ||
| 1049 | double8 __ovld __cnfn acospi(double8 x); | ||
| 1050 | double16 __ovld __cnfn acospi(double16 x); | ||
| 1051 | -#endif //cl_khr_fp64 | ||
| 1052 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1053 | #ifdef cl_khr_fp16 | ||
| 1054 | half __ovld __cnfn acospi(half x); | ||
| 1055 | half2 __ovld __cnfn acospi(half2 x); | ||
| 1056 | @@ -6612,14 +6611,14 @@ float3 __ovld __cnfn asin(float3); | ||
| 1057 | float4 __ovld __cnfn asin(float4); | ||
| 1058 | float8 __ovld __cnfn asin(float8); | ||
| 1059 | float16 __ovld __cnfn asin(float16); | ||
| 1060 | -#ifdef cl_khr_fp64 | ||
| 1061 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1062 | double __ovld __cnfn asin(double); | ||
| 1063 | double2 __ovld __cnfn asin(double2); | ||
| 1064 | double3 __ovld __cnfn asin(double3); | ||
| 1065 | double4 __ovld __cnfn asin(double4); | ||
| 1066 | double8 __ovld __cnfn asin(double8); | ||
| 1067 | double16 __ovld __cnfn asin(double16); | ||
| 1068 | -#endif //cl_khr_fp64 | ||
| 1069 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1070 | #ifdef cl_khr_fp16 | ||
| 1071 | half __ovld __cnfn asin(half); | ||
| 1072 | half2 __ovld __cnfn asin(half2); | ||
| 1073 | @@ -6638,14 +6637,14 @@ float3 __ovld __cnfn asinh(float3); | ||
| 1074 | float4 __ovld __cnfn asinh(float4); | ||
| 1075 | float8 __ovld __cnfn asinh(float8); | ||
| 1076 | float16 __ovld __cnfn asinh(float16); | ||
| 1077 | -#ifdef cl_khr_fp64 | ||
| 1078 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1079 | double __ovld __cnfn asinh(double); | ||
| 1080 | double2 __ovld __cnfn asinh(double2); | ||
| 1081 | double3 __ovld __cnfn asinh(double3); | ||
| 1082 | double4 __ovld __cnfn asinh(double4); | ||
| 1083 | double8 __ovld __cnfn asinh(double8); | ||
| 1084 | double16 __ovld __cnfn asinh(double16); | ||
| 1085 | -#endif //cl_khr_fp64 | ||
| 1086 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1087 | #ifdef cl_khr_fp16 | ||
| 1088 | half __ovld __cnfn asinh(half); | ||
| 1089 | half2 __ovld __cnfn asinh(half2); | ||
| 1090 | @@ -6664,14 +6663,14 @@ float3 __ovld __cnfn asinpi(float3 x); | ||
| 1091 | float4 __ovld __cnfn asinpi(float4 x); | ||
| 1092 | float8 __ovld __cnfn asinpi(float8 x); | ||
| 1093 | float16 __ovld __cnfn asinpi(float16 x); | ||
| 1094 | -#ifdef cl_khr_fp64 | ||
| 1095 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1096 | double __ovld __cnfn asinpi(double x); | ||
| 1097 | double2 __ovld __cnfn asinpi(double2 x); | ||
| 1098 | double3 __ovld __cnfn asinpi(double3 x); | ||
| 1099 | double4 __ovld __cnfn asinpi(double4 x); | ||
| 1100 | double8 __ovld __cnfn asinpi(double8 x); | ||
| 1101 | double16 __ovld __cnfn asinpi(double16 x); | ||
| 1102 | -#endif //cl_khr_fp64 | ||
| 1103 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1104 | #ifdef cl_khr_fp16 | ||
| 1105 | half __ovld __cnfn asinpi(half x); | ||
| 1106 | half2 __ovld __cnfn asinpi(half2 x); | ||
| 1107 | @@ -6690,14 +6689,14 @@ float3 __ovld __cnfn atan(float3 y_over_x); | ||
| 1108 | float4 __ovld __cnfn atan(float4 y_over_x); | ||
| 1109 | float8 __ovld __cnfn atan(float8 y_over_x); | ||
| 1110 | float16 __ovld __cnfn atan(float16 y_over_x); | ||
| 1111 | -#ifdef cl_khr_fp64 | ||
| 1112 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1113 | double __ovld __cnfn atan(double y_over_x); | ||
| 1114 | double2 __ovld __cnfn atan(double2 y_over_x); | ||
| 1115 | double3 __ovld __cnfn atan(double3 y_over_x); | ||
| 1116 | double4 __ovld __cnfn atan(double4 y_over_x); | ||
| 1117 | double8 __ovld __cnfn atan(double8 y_over_x); | ||
| 1118 | double16 __ovld __cnfn atan(double16 y_over_x); | ||
| 1119 | -#endif //cl_khr_fp64 | ||
| 1120 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1121 | #ifdef cl_khr_fp16 | ||
| 1122 | half __ovld __cnfn atan(half y_over_x); | ||
| 1123 | half2 __ovld __cnfn atan(half2 y_over_x); | ||
| 1124 | @@ -6716,14 +6715,14 @@ float3 __ovld __cnfn atan2(float3 y, float3 x); | ||
| 1125 | float4 __ovld __cnfn atan2(float4 y, float4 x); | ||
| 1126 | float8 __ovld __cnfn atan2(float8 y, float8 x); | ||
| 1127 | float16 __ovld __cnfn atan2(float16 y, float16 x); | ||
| 1128 | -#ifdef cl_khr_fp64 | ||
| 1129 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1130 | double __ovld __cnfn atan2(double y, double x); | ||
| 1131 | double2 __ovld __cnfn atan2(double2 y, double2 x); | ||
| 1132 | double3 __ovld __cnfn atan2(double3 y, double3 x); | ||
| 1133 | double4 __ovld __cnfn atan2(double4 y, double4 x); | ||
| 1134 | double8 __ovld __cnfn atan2(double8 y, double8 x); | ||
| 1135 | double16 __ovld __cnfn atan2(double16 y, double16 x); | ||
| 1136 | -#endif //cl_khr_fp64 | ||
| 1137 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1138 | #ifdef cl_khr_fp16 | ||
| 1139 | half __ovld __cnfn atan2(half y, half x); | ||
| 1140 | half2 __ovld __cnfn atan2(half2 y, half2 x); | ||
| 1141 | @@ -6742,14 +6741,14 @@ float3 __ovld __cnfn atanh(float3); | ||
| 1142 | float4 __ovld __cnfn atanh(float4); | ||
| 1143 | float8 __ovld __cnfn atanh(float8); | ||
| 1144 | float16 __ovld __cnfn atanh(float16); | ||
| 1145 | -#ifdef cl_khr_fp64 | ||
| 1146 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1147 | double __ovld __cnfn atanh(double); | ||
| 1148 | double2 __ovld __cnfn atanh(double2); | ||
| 1149 | double3 __ovld __cnfn atanh(double3); | ||
| 1150 | double4 __ovld __cnfn atanh(double4); | ||
| 1151 | double8 __ovld __cnfn atanh(double8); | ||
| 1152 | double16 __ovld __cnfn atanh(double16); | ||
| 1153 | -#endif //cl_khr_fp64 | ||
| 1154 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1155 | #ifdef cl_khr_fp16 | ||
| 1156 | half __ovld __cnfn atanh(half); | ||
| 1157 | half2 __ovld __cnfn atanh(half2); | ||
| 1158 | @@ -6768,14 +6767,14 @@ float3 __ovld __cnfn atanpi(float3 x); | ||
| 1159 | float4 __ovld __cnfn atanpi(float4 x); | ||
| 1160 | float8 __ovld __cnfn atanpi(float8 x); | ||
| 1161 | float16 __ovld __cnfn atanpi(float16 x); | ||
| 1162 | -#ifdef cl_khr_fp64 | ||
| 1163 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1164 | double __ovld __cnfn atanpi(double x); | ||
| 1165 | double2 __ovld __cnfn atanpi(double2 x); | ||
| 1166 | double3 __ovld __cnfn atanpi(double3 x); | ||
| 1167 | double4 __ovld __cnfn atanpi(double4 x); | ||
| 1168 | double8 __ovld __cnfn atanpi(double8 x); | ||
| 1169 | double16 __ovld __cnfn atanpi(double16 x); | ||
| 1170 | -#endif //cl_khr_fp64 | ||
| 1171 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1172 | #ifdef cl_khr_fp16 | ||
| 1173 | half __ovld __cnfn atanpi(half x); | ||
| 1174 | half2 __ovld __cnfn atanpi(half2 x); | ||
| 1175 | @@ -6794,14 +6793,14 @@ float3 __ovld __cnfn atan2pi(float3 y, float3 x); | ||
| 1176 | float4 __ovld __cnfn atan2pi(float4 y, float4 x); | ||
| 1177 | float8 __ovld __cnfn atan2pi(float8 y, float8 x); | ||
| 1178 | float16 __ovld __cnfn atan2pi(float16 y, float16 x); | ||
| 1179 | -#ifdef cl_khr_fp64 | ||
| 1180 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1181 | double __ovld __cnfn atan2pi(double y, double x); | ||
| 1182 | double2 __ovld __cnfn atan2pi(double2 y, double2 x); | ||
| 1183 | double3 __ovld __cnfn atan2pi(double3 y, double3 x); | ||
| 1184 | double4 __ovld __cnfn atan2pi(double4 y, double4 x); | ||
| 1185 | double8 __ovld __cnfn atan2pi(double8 y, double8 x); | ||
| 1186 | double16 __ovld __cnfn atan2pi(double16 y, double16 x); | ||
| 1187 | -#endif //cl_khr_fp64 | ||
| 1188 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1189 | #ifdef cl_khr_fp16 | ||
| 1190 | half __ovld __cnfn atan2pi(half y, half x); | ||
| 1191 | half2 __ovld __cnfn atan2pi(half2 y, half2 x); | ||
| 1192 | @@ -6820,14 +6819,14 @@ float3 __ovld __cnfn cbrt(float3); | ||
| 1193 | float4 __ovld __cnfn cbrt(float4); | ||
| 1194 | float8 __ovld __cnfn cbrt(float8); | ||
| 1195 | float16 __ovld __cnfn cbrt(float16); | ||
| 1196 | -#ifdef cl_khr_fp64 | ||
| 1197 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1198 | double __ovld __cnfn cbrt(double); | ||
| 1199 | double2 __ovld __cnfn cbrt(double2); | ||
| 1200 | double3 __ovld __cnfn cbrt(double3); | ||
| 1201 | double4 __ovld __cnfn cbrt(double4); | ||
| 1202 | double8 __ovld __cnfn cbrt(double8); | ||
| 1203 | double16 __ovld __cnfn cbrt(double16); | ||
| 1204 | -#endif //cl_khr_fp64 | ||
| 1205 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1206 | #ifdef cl_khr_fp16 | ||
| 1207 | half __ovld __cnfn cbrt(half); | ||
| 1208 | half2 __ovld __cnfn cbrt(half2); | ||
| 1209 | @@ -6847,14 +6846,14 @@ float3 __ovld __cnfn ceil(float3); | ||
| 1210 | float4 __ovld __cnfn ceil(float4); | ||
| 1211 | float8 __ovld __cnfn ceil(float8); | ||
| 1212 | float16 __ovld __cnfn ceil(float16); | ||
| 1213 | -#ifdef cl_khr_fp64 | ||
| 1214 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1215 | double __ovld __cnfn ceil(double); | ||
| 1216 | double2 __ovld __cnfn ceil(double2); | ||
| 1217 | double3 __ovld __cnfn ceil(double3); | ||
| 1218 | double4 __ovld __cnfn ceil(double4); | ||
| 1219 | double8 __ovld __cnfn ceil(double8); | ||
| 1220 | double16 __ovld __cnfn ceil(double16); | ||
| 1221 | -#endif //cl_khr_fp64 | ||
| 1222 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1223 | #ifdef cl_khr_fp16 | ||
| 1224 | half __ovld __cnfn ceil(half); | ||
| 1225 | half2 __ovld __cnfn ceil(half2); | ||
| 1226 | @@ -6873,14 +6872,14 @@ float3 __ovld __cnfn copysign(float3 x, float3 y); | ||
| 1227 | float4 __ovld __cnfn copysign(float4 x, float4 y); | ||
| 1228 | float8 __ovld __cnfn copysign(float8 x, float8 y); | ||
| 1229 | float16 __ovld __cnfn copysign(float16 x, float16 y); | ||
| 1230 | -#ifdef cl_khr_fp64 | ||
| 1231 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1232 | double __ovld __cnfn copysign(double x, double y); | ||
| 1233 | double2 __ovld __cnfn copysign(double2 x, double2 y); | ||
| 1234 | double3 __ovld __cnfn copysign(double3 x, double3 y); | ||
| 1235 | double4 __ovld __cnfn copysign(double4 x, double4 y); | ||
| 1236 | double8 __ovld __cnfn copysign(double8 x, double8 y); | ||
| 1237 | double16 __ovld __cnfn copysign(double16 x, double16 y); | ||
| 1238 | -#endif //cl_khr_fp64 | ||
| 1239 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1240 | #ifdef cl_khr_fp16 | ||
| 1241 | half __ovld __cnfn copysign(half x, half y); | ||
| 1242 | half2 __ovld __cnfn copysign(half2 x, half2 y); | ||
| 1243 | @@ -6899,14 +6898,14 @@ float3 __ovld __cnfn cos(float3); | ||
| 1244 | float4 __ovld __cnfn cos(float4); | ||
| 1245 | float8 __ovld __cnfn cos(float8); | ||
| 1246 | float16 __ovld __cnfn cos(float16); | ||
| 1247 | -#ifdef cl_khr_fp64 | ||
| 1248 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1249 | double __ovld __cnfn cos(double); | ||
| 1250 | double2 __ovld __cnfn cos(double2); | ||
| 1251 | double3 __ovld __cnfn cos(double3); | ||
| 1252 | double4 __ovld __cnfn cos(double4); | ||
| 1253 | double8 __ovld __cnfn cos(double8); | ||
| 1254 | double16 __ovld __cnfn cos(double16); | ||
| 1255 | -#endif //cl_khr_fp64 | ||
| 1256 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1257 | #ifdef cl_khr_fp16 | ||
| 1258 | half __ovld __cnfn cos(half); | ||
| 1259 | half2 __ovld __cnfn cos(half2); | ||
| 1260 | @@ -6925,14 +6924,14 @@ float3 __ovld __cnfn cosh(float3); | ||
| 1261 | float4 __ovld __cnfn cosh(float4); | ||
| 1262 | float8 __ovld __cnfn cosh(float8); | ||
| 1263 | float16 __ovld __cnfn cosh(float16); | ||
| 1264 | -#ifdef cl_khr_fp64 | ||
| 1265 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1266 | double __ovld __cnfn cosh(double); | ||
| 1267 | double2 __ovld __cnfn cosh(double2); | ||
| 1268 | double3 __ovld __cnfn cosh(double3); | ||
| 1269 | double4 __ovld __cnfn cosh(double4); | ||
| 1270 | double8 __ovld __cnfn cosh(double8); | ||
| 1271 | double16 __ovld __cnfn cosh(double16); | ||
| 1272 | -#endif //cl_khr_fp64 | ||
| 1273 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1274 | #ifdef cl_khr_fp16 | ||
| 1275 | half __ovld __cnfn cosh(half); | ||
| 1276 | half2 __ovld __cnfn cosh(half2); | ||
| 1277 | @@ -6951,14 +6950,14 @@ float3 __ovld __cnfn cospi(float3 x); | ||
| 1278 | float4 __ovld __cnfn cospi(float4 x); | ||
| 1279 | float8 __ovld __cnfn cospi(float8 x); | ||
| 1280 | float16 __ovld __cnfn cospi(float16 x); | ||
| 1281 | -#ifdef cl_khr_fp64 | ||
| 1282 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1283 | double __ovld __cnfn cospi(double x); | ||
| 1284 | double2 __ovld __cnfn cospi(double2 x); | ||
| 1285 | double3 __ovld __cnfn cospi(double3 x); | ||
| 1286 | double4 __ovld __cnfn cospi(double4 x); | ||
| 1287 | double8 __ovld __cnfn cospi(double8 x); | ||
| 1288 | double16 __ovld __cnfn cospi(double16 x); | ||
| 1289 | -#endif //cl_khr_fp64 | ||
| 1290 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1291 | #ifdef cl_khr_fp16 | ||
| 1292 | half __ovld __cnfn cospi(half x); | ||
| 1293 | half2 __ovld __cnfn cospi(half2 x); | ||
| 1294 | @@ -6977,14 +6976,14 @@ float3 __ovld __cnfn erfc(float3); | ||
| 1295 | float4 __ovld __cnfn erfc(float4); | ||
| 1296 | float8 __ovld __cnfn erfc(float8); | ||
| 1297 | float16 __ovld __cnfn erfc(float16); | ||
| 1298 | -#ifdef cl_khr_fp64 | ||
| 1299 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1300 | double __ovld __cnfn erfc(double); | ||
| 1301 | double2 __ovld __cnfn erfc(double2); | ||
| 1302 | double3 __ovld __cnfn erfc(double3); | ||
| 1303 | double4 __ovld __cnfn erfc(double4); | ||
| 1304 | double8 __ovld __cnfn erfc(double8); | ||
| 1305 | double16 __ovld __cnfn erfc(double16); | ||
| 1306 | -#endif //cl_khr_fp64 | ||
| 1307 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1308 | #ifdef cl_khr_fp16 | ||
| 1309 | half __ovld __cnfn erfc(half); | ||
| 1310 | half2 __ovld __cnfn erfc(half2); | ||
| 1311 | @@ -7004,14 +7003,14 @@ float3 __ovld __cnfn erf(float3); | ||
| 1312 | float4 __ovld __cnfn erf(float4); | ||
| 1313 | float8 __ovld __cnfn erf(float8); | ||
| 1314 | float16 __ovld __cnfn erf(float16); | ||
| 1315 | -#ifdef cl_khr_fp64 | ||
| 1316 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1317 | double __ovld __cnfn erf(double); | ||
| 1318 | double2 __ovld __cnfn erf(double2); | ||
| 1319 | double3 __ovld __cnfn erf(double3); | ||
| 1320 | double4 __ovld __cnfn erf(double4); | ||
| 1321 | double8 __ovld __cnfn erf(double8); | ||
| 1322 | double16 __ovld __cnfn erf(double16); | ||
| 1323 | -#endif //cl_khr_fp64 | ||
| 1324 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1325 | #ifdef cl_khr_fp16 | ||
| 1326 | half __ovld __cnfn erf(half); | ||
| 1327 | half2 __ovld __cnfn erf(half2); | ||
| 1328 | @@ -7030,14 +7029,14 @@ float3 __ovld __cnfn exp(float3 x); | ||
| 1329 | float4 __ovld __cnfn exp(float4 x); | ||
| 1330 | float8 __ovld __cnfn exp(float8 x); | ||
| 1331 | float16 __ovld __cnfn exp(float16 x); | ||
| 1332 | -#ifdef cl_khr_fp64 | ||
| 1333 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1334 | double __ovld __cnfn exp(double x); | ||
| 1335 | double2 __ovld __cnfn exp(double2 x); | ||
| 1336 | double3 __ovld __cnfn exp(double3 x); | ||
| 1337 | double4 __ovld __cnfn exp(double4 x); | ||
| 1338 | double8 __ovld __cnfn exp(double8 x); | ||
| 1339 | double16 __ovld __cnfn exp(double16 x); | ||
| 1340 | -#endif //cl_khr_fp64 | ||
| 1341 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1342 | #ifdef cl_khr_fp16 | ||
| 1343 | half __ovld __cnfn exp(half x); | ||
| 1344 | half2 __ovld __cnfn exp(half2 x); | ||
| 1345 | @@ -7056,14 +7055,14 @@ float3 __ovld __cnfn exp2(float3); | ||
| 1346 | float4 __ovld __cnfn exp2(float4); | ||
| 1347 | float8 __ovld __cnfn exp2(float8); | ||
| 1348 | float16 __ovld __cnfn exp2(float16); | ||
| 1349 | -#ifdef cl_khr_fp64 | ||
| 1350 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1351 | double __ovld __cnfn exp2(double); | ||
| 1352 | double2 __ovld __cnfn exp2(double2); | ||
| 1353 | double3 __ovld __cnfn exp2(double3); | ||
| 1354 | double4 __ovld __cnfn exp2(double4); | ||
| 1355 | double8 __ovld __cnfn exp2(double8); | ||
| 1356 | double16 __ovld __cnfn exp2(double16); | ||
| 1357 | -#endif //cl_khr_fp64 | ||
| 1358 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1359 | #ifdef cl_khr_fp16 | ||
| 1360 | half __ovld __cnfn exp2(half); | ||
| 1361 | half2 __ovld __cnfn exp2(half2); | ||
| 1362 | @@ -7082,14 +7081,14 @@ float3 __ovld __cnfn exp10(float3); | ||
| 1363 | float4 __ovld __cnfn exp10(float4); | ||
| 1364 | float8 __ovld __cnfn exp10(float8); | ||
| 1365 | float16 __ovld __cnfn exp10(float16); | ||
| 1366 | -#ifdef cl_khr_fp64 | ||
| 1367 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1368 | double __ovld __cnfn exp10(double); | ||
| 1369 | double2 __ovld __cnfn exp10(double2); | ||
| 1370 | double3 __ovld __cnfn exp10(double3); | ||
| 1371 | double4 __ovld __cnfn exp10(double4); | ||
| 1372 | double8 __ovld __cnfn exp10(double8); | ||
| 1373 | double16 __ovld __cnfn exp10(double16); | ||
| 1374 | -#endif //cl_khr_fp64 | ||
| 1375 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1376 | #ifdef cl_khr_fp16 | ||
| 1377 | half __ovld __cnfn exp10(half); | ||
| 1378 | half2 __ovld __cnfn exp10(half2); | ||
| 1379 | @@ -7108,14 +7107,14 @@ float3 __ovld __cnfn expm1(float3 x); | ||
| 1380 | float4 __ovld __cnfn expm1(float4 x); | ||
| 1381 | float8 __ovld __cnfn expm1(float8 x); | ||
| 1382 | float16 __ovld __cnfn expm1(float16 x); | ||
| 1383 | -#ifdef cl_khr_fp64 | ||
| 1384 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1385 | double __ovld __cnfn expm1(double x); | ||
| 1386 | double2 __ovld __cnfn expm1(double2 x); | ||
| 1387 | double3 __ovld __cnfn expm1(double3 x); | ||
| 1388 | double4 __ovld __cnfn expm1(double4 x); | ||
| 1389 | double8 __ovld __cnfn expm1(double8 x); | ||
| 1390 | double16 __ovld __cnfn expm1(double16 x); | ||
| 1391 | -#endif //cl_khr_fp64 | ||
| 1392 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1393 | #ifdef cl_khr_fp16 | ||
| 1394 | half __ovld __cnfn expm1(half x); | ||
| 1395 | half2 __ovld __cnfn expm1(half2 x); | ||
| 1396 | @@ -7134,14 +7133,14 @@ float3 __ovld __cnfn fabs(float3); | ||
| 1397 | float4 __ovld __cnfn fabs(float4); | ||
| 1398 | float8 __ovld __cnfn fabs(float8); | ||
| 1399 | float16 __ovld __cnfn fabs(float16); | ||
| 1400 | -#ifdef cl_khr_fp64 | ||
| 1401 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1402 | double __ovld __cnfn fabs(double); | ||
| 1403 | double2 __ovld __cnfn fabs(double2); | ||
| 1404 | double3 __ovld __cnfn fabs(double3); | ||
| 1405 | double4 __ovld __cnfn fabs(double4); | ||
| 1406 | double8 __ovld __cnfn fabs(double8); | ||
| 1407 | double16 __ovld __cnfn fabs(double16); | ||
| 1408 | -#endif //cl_khr_fp64 | ||
| 1409 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1410 | #ifdef cl_khr_fp16 | ||
| 1411 | half __ovld __cnfn fabs(half); | ||
| 1412 | half2 __ovld __cnfn fabs(half2); | ||
| 1413 | @@ -7160,14 +7159,14 @@ float3 __ovld __cnfn fdim(float3 x, float3 y); | ||
| 1414 | float4 __ovld __cnfn fdim(float4 x, float4 y); | ||
| 1415 | float8 __ovld __cnfn fdim(float8 x, float8 y); | ||
| 1416 | float16 __ovld __cnfn fdim(float16 x, float16 y); | ||
| 1417 | -#ifdef cl_khr_fp64 | ||
| 1418 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1419 | double __ovld __cnfn fdim(double x, double y); | ||
| 1420 | double2 __ovld __cnfn fdim(double2 x, double2 y); | ||
| 1421 | double3 __ovld __cnfn fdim(double3 x, double3 y); | ||
| 1422 | double4 __ovld __cnfn fdim(double4 x, double4 y); | ||
| 1423 | double8 __ovld __cnfn fdim(double8 x, double8 y); | ||
| 1424 | double16 __ovld __cnfn fdim(double16 x, double16 y); | ||
| 1425 | -#endif //cl_khr_fp64 | ||
| 1426 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1427 | #ifdef cl_khr_fp16 | ||
| 1428 | half __ovld __cnfn fdim(half x, half y); | ||
| 1429 | half2 __ovld __cnfn fdim(half2 x, half2 y); | ||
| 1430 | @@ -7187,14 +7186,14 @@ float3 __ovld __cnfn floor(float3); | ||
| 1431 | float4 __ovld __cnfn floor(float4); | ||
| 1432 | float8 __ovld __cnfn floor(float8); | ||
| 1433 | float16 __ovld __cnfn floor(float16); | ||
| 1434 | -#ifdef cl_khr_fp64 | ||
| 1435 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1436 | double __ovld __cnfn floor(double); | ||
| 1437 | double2 __ovld __cnfn floor(double2); | ||
| 1438 | double3 __ovld __cnfn floor(double3); | ||
| 1439 | double4 __ovld __cnfn floor(double4); | ||
| 1440 | double8 __ovld __cnfn floor(double8); | ||
| 1441 | double16 __ovld __cnfn floor(double16); | ||
| 1442 | -#endif //cl_khr_fp64 | ||
| 1443 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1444 | #ifdef cl_khr_fp16 | ||
| 1445 | half __ovld __cnfn floor(half); | ||
| 1446 | half2 __ovld __cnfn floor(half2); | ||
| 1447 | @@ -7217,14 +7216,14 @@ float3 __ovld __cnfn fma(float3 a, float3 b, float3 c); | ||
| 1448 | float4 __ovld __cnfn fma(float4 a, float4 b, float4 c); | ||
| 1449 | float8 __ovld __cnfn fma(float8 a, float8 b, float8 c); | ||
| 1450 | float16 __ovld __cnfn fma(float16 a, float16 b, float16 c); | ||
| 1451 | -#ifdef cl_khr_fp64 | ||
| 1452 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1453 | double __ovld __cnfn fma(double a, double b, double c); | ||
| 1454 | double2 __ovld __cnfn fma(double2 a, double2 b, double2 c); | ||
| 1455 | double3 __ovld __cnfn fma(double3 a, double3 b, double3 c); | ||
| 1456 | double4 __ovld __cnfn fma(double4 a, double4 b, double4 c); | ||
| 1457 | double8 __ovld __cnfn fma(double8 a, double8 b, double8 c); | ||
| 1458 | double16 __ovld __cnfn fma(double16 a, double16 b, double16 c); | ||
| 1459 | -#endif //cl_khr_fp64 | ||
| 1460 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1461 | #ifdef cl_khr_fp16 | ||
| 1462 | half __ovld __cnfn fma(half a, half b, half c); | ||
| 1463 | half2 __ovld __cnfn fma(half2 a, half2 b, half2 c); | ||
| 1464 | @@ -7251,7 +7250,7 @@ float3 __ovld __cnfn fmax(float3 x, float y); | ||
| 1465 | float4 __ovld __cnfn fmax(float4 x, float y); | ||
| 1466 | float8 __ovld __cnfn fmax(float8 x, float y); | ||
| 1467 | float16 __ovld __cnfn fmax(float16 x, float y); | ||
| 1468 | -#ifdef cl_khr_fp64 | ||
| 1469 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1470 | double __ovld __cnfn fmax(double x, double y); | ||
| 1471 | double2 __ovld __cnfn fmax(double2 x, double2 y); | ||
| 1472 | double3 __ovld __cnfn fmax(double3 x, double3 y); | ||
| 1473 | @@ -7263,7 +7262,7 @@ double3 __ovld __cnfn fmax(double3 x, double y); | ||
| 1474 | double4 __ovld __cnfn fmax(double4 x, double y); | ||
| 1475 | double8 __ovld __cnfn fmax(double8 x, double y); | ||
| 1476 | double16 __ovld __cnfn fmax(double16 x, double y); | ||
| 1477 | -#endif //cl_khr_fp64 | ||
| 1478 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1479 | #ifdef cl_khr_fp16 | ||
| 1480 | half __ovld __cnfn fmax(half x, half y); | ||
| 1481 | half2 __ovld __cnfn fmax(half2 x, half2 y); | ||
| 1482 | @@ -7295,7 +7294,7 @@ float3 __ovld __cnfn fmin(float3 x, float y); | ||
| 1483 | float4 __ovld __cnfn fmin(float4 x, float y); | ||
| 1484 | float8 __ovld __cnfn fmin(float8 x, float y); | ||
| 1485 | float16 __ovld __cnfn fmin(float16 x, float y); | ||
| 1486 | -#ifdef cl_khr_fp64 | ||
| 1487 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1488 | double __ovld __cnfn fmin(double x, double y); | ||
| 1489 | double2 __ovld __cnfn fmin(double2 x, double2 y); | ||
| 1490 | double3 __ovld __cnfn fmin(double3 x, double3 y); | ||
| 1491 | @@ -7307,7 +7306,7 @@ double3 __ovld __cnfn fmin(double3 x, double y); | ||
| 1492 | double4 __ovld __cnfn fmin(double4 x, double y); | ||
| 1493 | double8 __ovld __cnfn fmin(double8 x, double y); | ||
| 1494 | double16 __ovld __cnfn fmin(double16 x, double y); | ||
| 1495 | -#endif //cl_khr_fp64 | ||
| 1496 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1497 | #ifdef cl_khr_fp16 | ||
| 1498 | half __ovld __cnfn fmin(half x, half y); | ||
| 1499 | half2 __ovld __cnfn fmin(half2 x, half2 y); | ||
| 1500 | @@ -7331,14 +7330,14 @@ float3 __ovld __cnfn fmod(float3 x, float3 y); | ||
| 1501 | float4 __ovld __cnfn fmod(float4 x, float4 y); | ||
| 1502 | float8 __ovld __cnfn fmod(float8 x, float8 y); | ||
| 1503 | float16 __ovld __cnfn fmod(float16 x, float16 y); | ||
| 1504 | -#ifdef cl_khr_fp64 | ||
| 1505 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1506 | double __ovld __cnfn fmod(double x, double y); | ||
| 1507 | double2 __ovld __cnfn fmod(double2 x, double2 y); | ||
| 1508 | double3 __ovld __cnfn fmod(double3 x, double3 y); | ||
| 1509 | double4 __ovld __cnfn fmod(double4 x, double4 y); | ||
| 1510 | double8 __ovld __cnfn fmod(double8 x, double8 y); | ||
| 1511 | double16 __ovld __cnfn fmod(double16 x, double16 y); | ||
| 1512 | -#endif //cl_khr_fp64 | ||
| 1513 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1514 | #ifdef cl_khr_fp16 | ||
| 1515 | half __ovld __cnfn fmod(half x, half y); | ||
| 1516 | half2 __ovld __cnfn fmod(half2 x, half2 y); | ||
| 1517 | @@ -7352,21 +7351,21 @@ half16 __ovld __cnfn fmod(half16 x, half16 y); | ||
| 1518 | * Returns fmin(x - floor (x), 0x1.fffffep-1f ). | ||
| 1519 | * floor(x) is returned in iptr. | ||
| 1520 | */ | ||
| 1521 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1522 | +#ifdef __opencl_c_generic_address_space | ||
| 1523 | float __ovld fract(float x, float *iptr); | ||
| 1524 | float2 __ovld fract(float2 x, float2 *iptr); | ||
| 1525 | float3 __ovld fract(float3 x, float3 *iptr); | ||
| 1526 | float4 __ovld fract(float4 x, float4 *iptr); | ||
| 1527 | float8 __ovld fract(float8 x, float8 *iptr); | ||
| 1528 | float16 __ovld fract(float16 x, float16 *iptr); | ||
| 1529 | -#ifdef cl_khr_fp64 | ||
| 1530 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1531 | double __ovld fract(double x, double *iptr); | ||
| 1532 | double2 __ovld fract(double2 x, double2 *iptr); | ||
| 1533 | double3 __ovld fract(double3 x, double3 *iptr); | ||
| 1534 | double4 __ovld fract(double4 x, double4 *iptr); | ||
| 1535 | double8 __ovld fract(double8 x, double8 *iptr); | ||
| 1536 | double16 __ovld fract(double16 x, double16 *iptr); | ||
| 1537 | -#endif //cl_khr_fp64 | ||
| 1538 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1539 | #ifdef cl_khr_fp16 | ||
| 1540 | half __ovld fract(half x, half *iptr); | ||
| 1541 | half2 __ovld fract(half2 x, half2 *iptr); | ||
| 1542 | @@ -7375,7 +7374,9 @@ half4 __ovld fract(half4 x, half4 *iptr); | ||
| 1543 | half8 __ovld fract(half8 x, half8 *iptr); | ||
| 1544 | half16 __ovld fract(half16 x, half16 *iptr); | ||
| 1545 | #endif //cl_khr_fp16 | ||
| 1546 | -#else | ||
| 1547 | +#endif //__opencl_c_generic_address_space | ||
| 1548 | + | ||
| 1549 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 1550 | float __ovld fract(float x, __global float *iptr); | ||
| 1551 | float2 __ovld fract(float2 x, __global float2 *iptr); | ||
| 1552 | float3 __ovld fract(float3 x, __global float3 *iptr); | ||
| 1553 | @@ -7394,7 +7395,7 @@ float3 __ovld fract(float3 x, __private float3 *iptr); | ||
| 1554 | float4 __ovld fract(float4 x, __private float4 *iptr); | ||
| 1555 | float8 __ovld fract(float8 x, __private float8 *iptr); | ||
| 1556 | float16 __ovld fract(float16 x, __private float16 *iptr); | ||
| 1557 | -#ifdef cl_khr_fp64 | ||
| 1558 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1559 | double __ovld fract(double x, __global double *iptr); | ||
| 1560 | double2 __ovld fract(double2 x, __global double2 *iptr); | ||
| 1561 | double3 __ovld fract(double3 x, __global double3 *iptr); | ||
| 1562 | @@ -7413,7 +7414,7 @@ double3 __ovld fract(double3 x, __private double3 *iptr); | ||
| 1563 | double4 __ovld fract(double4 x, __private double4 *iptr); | ||
| 1564 | double8 __ovld fract(double8 x, __private double8 *iptr); | ||
| 1565 | double16 __ovld fract(double16 x, __private double16 *iptr); | ||
| 1566 | -#endif //cl_khr_fp64 | ||
| 1567 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1568 | #ifdef cl_khr_fp16 | ||
| 1569 | half __ovld fract(half x, __global half *iptr); | ||
| 1570 | half2 __ovld fract(half2 x, __global half2 *iptr); | ||
| 1571 | @@ -7434,29 +7435,29 @@ half4 __ovld fract(half4 x, __private half4 *iptr); | ||
| 1572 | half8 __ovld fract(half8 x, __private half8 *iptr); | ||
| 1573 | half16 __ovld fract(half16 x, __private half16 *iptr); | ||
| 1574 | #endif //cl_khr_fp16 | ||
| 1575 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1576 | - | ||
| 1577 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 1578 | + //! CL_VERSION_2_0) | ||
| 1579 | /** | ||
| 1580 | * Extract mantissa and exponent from x. For each | ||
| 1581 | * component the mantissa returned is a float with | ||
| 1582 | * magnitude in the interval [1/2, 1) or 0. Each | ||
| 1583 | * component of x equals mantissa returned * 2^exp. | ||
| 1584 | */ | ||
| 1585 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1586 | +#ifdef __opencl_c_generic_address_space | ||
| 1587 | float __ovld frexp(float x, int *exp); | ||
| 1588 | float2 __ovld frexp(float2 x, int2 *exp); | ||
| 1589 | float3 __ovld frexp(float3 x, int3 *exp); | ||
| 1590 | float4 __ovld frexp(float4 x, int4 *exp); | ||
| 1591 | float8 __ovld frexp(float8 x, int8 *exp); | ||
| 1592 | float16 __ovld frexp(float16 x, int16 *exp); | ||
| 1593 | -#ifdef cl_khr_fp64 | ||
| 1594 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1595 | double __ovld frexp(double x, int *exp); | ||
| 1596 | double2 __ovld frexp(double2 x, int2 *exp); | ||
| 1597 | double3 __ovld frexp(double3 x, int3 *exp); | ||
| 1598 | double4 __ovld frexp(double4 x, int4 *exp); | ||
| 1599 | double8 __ovld frexp(double8 x, int8 *exp); | ||
| 1600 | double16 __ovld frexp(double16 x, int16 *exp); | ||
| 1601 | -#endif //cl_khr_fp64 | ||
| 1602 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1603 | #ifdef cl_khr_fp16 | ||
| 1604 | half __ovld frexp(half x, int *exp); | ||
| 1605 | half2 __ovld frexp(half2 x, int2 *exp); | ||
| 1606 | @@ -7465,7 +7466,9 @@ half4 __ovld frexp(half4 x, int4 *exp); | ||
| 1607 | half8 __ovld frexp(half8 x, int8 *exp); | ||
| 1608 | half16 __ovld frexp(half16 x, int16 *exp); | ||
| 1609 | #endif //cl_khr_fp16 | ||
| 1610 | -#else | ||
| 1611 | +#endif //__opencl_c_generic_address_space | ||
| 1612 | + | ||
| 1613 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 1614 | float __ovld frexp(float x, __global int *exp); | ||
| 1615 | float2 __ovld frexp(float2 x, __global int2 *exp); | ||
| 1616 | float3 __ovld frexp(float3 x, __global int3 *exp); | ||
| 1617 | @@ -7484,7 +7487,7 @@ float3 __ovld frexp(float3 x, __private int3 *exp); | ||
| 1618 | float4 __ovld frexp(float4 x, __private int4 *exp); | ||
| 1619 | float8 __ovld frexp(float8 x, __private int8 *exp); | ||
| 1620 | float16 __ovld frexp(float16 x, __private int16 *exp); | ||
| 1621 | -#ifdef cl_khr_fp64 | ||
| 1622 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1623 | double __ovld frexp(double x, __global int *exp); | ||
| 1624 | double2 __ovld frexp(double2 x, __global int2 *exp); | ||
| 1625 | double3 __ovld frexp(double3 x, __global int3 *exp); | ||
| 1626 | @@ -7503,7 +7506,7 @@ double3 __ovld frexp(double3 x, __private int3 *exp); | ||
| 1627 | double4 __ovld frexp(double4 x, __private int4 *exp); | ||
| 1628 | double8 __ovld frexp(double8 x, __private int8 *exp); | ||
| 1629 | double16 __ovld frexp(double16 x, __private int16 *exp); | ||
| 1630 | -#endif //cl_khr_fp64 | ||
| 1631 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1632 | #ifdef cl_khr_fp16 | ||
| 1633 | half __ovld frexp(half x, __global int *exp); | ||
| 1634 | half2 __ovld frexp(half2 x, __global int2 *exp); | ||
| 1635 | @@ -7524,7 +7527,8 @@ half4 __ovld frexp(half4 x, __private int4 *exp); | ||
| 1636 | half8 __ovld frexp(half8 x, __private int8 *exp); | ||
| 1637 | half16 __ovld frexp(half16 x, __private int16 *exp); | ||
| 1638 | #endif //cl_khr_fp16 | ||
| 1639 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1640 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 1641 | + //! CL_VERSION_2_0) | ||
| 1642 | |||
| 1643 | /** | ||
| 1644 | * Compute the value of the square root of x^2 + y^2 | ||
| 1645 | @@ -7536,14 +7540,14 @@ float3 __ovld __cnfn hypot(float3 x, float3 y); | ||
| 1646 | float4 __ovld __cnfn hypot(float4 x, float4 y); | ||
| 1647 | float8 __ovld __cnfn hypot(float8 x, float8 y); | ||
| 1648 | float16 __ovld __cnfn hypot(float16 x, float16 y); | ||
| 1649 | -#ifdef cl_khr_fp64 | ||
| 1650 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1651 | double __ovld __cnfn hypot(double x, double y); | ||
| 1652 | double2 __ovld __cnfn hypot(double2 x, double2 y); | ||
| 1653 | double3 __ovld __cnfn hypot(double3 x, double3 y); | ||
| 1654 | double4 __ovld __cnfn hypot(double4 x, double4 y); | ||
| 1655 | double8 __ovld __cnfn hypot(double8 x, double8 y); | ||
| 1656 | double16 __ovld __cnfn hypot(double16 x, double16 y); | ||
| 1657 | -#endif //cl_khr_fp64 | ||
| 1658 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1659 | #ifdef cl_khr_fp16 | ||
| 1660 | half __ovld __cnfn hypot(half x, half y); | ||
| 1661 | half2 __ovld __cnfn hypot(half2 x, half2 y); | ||
| 1662 | @@ -7562,14 +7566,14 @@ int3 __ovld __cnfn ilogb(float3 x); | ||
| 1663 | int4 __ovld __cnfn ilogb(float4 x); | ||
| 1664 | int8 __ovld __cnfn ilogb(float8 x); | ||
| 1665 | int16 __ovld __cnfn ilogb(float16 x); | ||
| 1666 | -#ifdef cl_khr_fp64 | ||
| 1667 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1668 | int __ovld __cnfn ilogb(double x); | ||
| 1669 | int2 __ovld __cnfn ilogb(double2 x); | ||
| 1670 | int3 __ovld __cnfn ilogb(double3 x); | ||
| 1671 | int4 __ovld __cnfn ilogb(double4 x); | ||
| 1672 | int8 __ovld __cnfn ilogb(double8 x); | ||
| 1673 | int16 __ovld __cnfn ilogb(double16 x); | ||
| 1674 | -#endif //cl_khr_fp64 | ||
| 1675 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1676 | #ifdef cl_khr_fp16 | ||
| 1677 | int __ovld __cnfn ilogb(half x); | ||
| 1678 | int2 __ovld __cnfn ilogb(half2 x); | ||
| 1679 | @@ -7593,7 +7597,7 @@ float3 __ovld __cnfn ldexp(float3 x, int n); | ||
| 1680 | float4 __ovld __cnfn ldexp(float4 x, int n); | ||
| 1681 | float8 __ovld __cnfn ldexp(float8 x, int n); | ||
| 1682 | float16 __ovld __cnfn ldexp(float16 x, int n); | ||
| 1683 | -#ifdef cl_khr_fp64 | ||
| 1684 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1685 | double __ovld __cnfn ldexp(double x, int n); | ||
| 1686 | double2 __ovld __cnfn ldexp(double2 x, int2 n); | ||
| 1687 | double3 __ovld __cnfn ldexp(double3 x, int3 n); | ||
| 1688 | @@ -7605,7 +7609,7 @@ double3 __ovld __cnfn ldexp(double3 x, int n); | ||
| 1689 | double4 __ovld __cnfn ldexp(double4 x, int n); | ||
| 1690 | double8 __ovld __cnfn ldexp(double8 x, int n); | ||
| 1691 | double16 __ovld __cnfn ldexp(double16 x, int n); | ||
| 1692 | -#endif //cl_khr_fp64 | ||
| 1693 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1694 | #ifdef cl_khr_fp16 | ||
| 1695 | half __ovld __cnfn ldexp(half x, int n); | ||
| 1696 | half2 __ovld __cnfn ldexp(half2 x, int2 n); | ||
| 1697 | @@ -7632,14 +7636,14 @@ float3 __ovld __cnfn lgamma(float3 x); | ||
| 1698 | float4 __ovld __cnfn lgamma(float4 x); | ||
| 1699 | float8 __ovld __cnfn lgamma(float8 x); | ||
| 1700 | float16 __ovld __cnfn lgamma(float16 x); | ||
| 1701 | -#ifdef cl_khr_fp64 | ||
| 1702 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1703 | double __ovld __cnfn lgamma(double x); | ||
| 1704 | double2 __ovld __cnfn lgamma(double2 x); | ||
| 1705 | double3 __ovld __cnfn lgamma(double3 x); | ||
| 1706 | double4 __ovld __cnfn lgamma(double4 x); | ||
| 1707 | double8 __ovld __cnfn lgamma(double8 x); | ||
| 1708 | double16 __ovld __cnfn lgamma(double16 x); | ||
| 1709 | -#endif //cl_khr_fp64 | ||
| 1710 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1711 | #ifdef cl_khr_fp16 | ||
| 1712 | half __ovld __cnfn lgamma(half x); | ||
| 1713 | half2 __ovld __cnfn lgamma(half2 x); | ||
| 1714 | @@ -7649,21 +7653,21 @@ half8 __ovld __cnfn lgamma(half8 x); | ||
| 1715 | half16 __ovld __cnfn lgamma(half16 x); | ||
| 1716 | #endif //cl_khr_fp16 | ||
| 1717 | |||
| 1718 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1719 | +#ifdef __opencl_c_generic_address_space | ||
| 1720 | float __ovld lgamma_r(float x, int *signp); | ||
| 1721 | float2 __ovld lgamma_r(float2 x, int2 *signp); | ||
| 1722 | float3 __ovld lgamma_r(float3 x, int3 *signp); | ||
| 1723 | float4 __ovld lgamma_r(float4 x, int4 *signp); | ||
| 1724 | float8 __ovld lgamma_r(float8 x, int8 *signp); | ||
| 1725 | float16 __ovld lgamma_r(float16 x, int16 *signp); | ||
| 1726 | -#ifdef cl_khr_fp64 | ||
| 1727 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1728 | double __ovld lgamma_r(double x, int *signp); | ||
| 1729 | double2 __ovld lgamma_r(double2 x, int2 *signp); | ||
| 1730 | double3 __ovld lgamma_r(double3 x, int3 *signp); | ||
| 1731 | double4 __ovld lgamma_r(double4 x, int4 *signp); | ||
| 1732 | double8 __ovld lgamma_r(double8 x, int8 *signp); | ||
| 1733 | double16 __ovld lgamma_r(double16 x, int16 *signp); | ||
| 1734 | -#endif //cl_khr_fp64 | ||
| 1735 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1736 | #ifdef cl_khr_fp16 | ||
| 1737 | half __ovld lgamma_r(half x, int *signp); | ||
| 1738 | half2 __ovld lgamma_r(half2 x, int2 *signp); | ||
| 1739 | @@ -7672,7 +7676,9 @@ half4 __ovld lgamma_r(half4 x, int4 *signp); | ||
| 1740 | half8 __ovld lgamma_r(half8 x, int8 *signp); | ||
| 1741 | half16 __ovld lgamma_r(half16 x, int16 *signp); | ||
| 1742 | #endif //cl_khr_fp16 | ||
| 1743 | -#else | ||
| 1744 | +#endif //__opencl_c_generic_address_space | ||
| 1745 | + | ||
| 1746 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 1747 | float __ovld lgamma_r(float x, __global int *signp); | ||
| 1748 | float2 __ovld lgamma_r(float2 x, __global int2 *signp); | ||
| 1749 | float3 __ovld lgamma_r(float3 x, __global int3 *signp); | ||
| 1750 | @@ -7691,7 +7697,7 @@ float3 __ovld lgamma_r(float3 x, __private int3 *signp); | ||
| 1751 | float4 __ovld lgamma_r(float4 x, __private int4 *signp); | ||
| 1752 | float8 __ovld lgamma_r(float8 x, __private int8 *signp); | ||
| 1753 | float16 __ovld lgamma_r(float16 x, __private int16 *signp); | ||
| 1754 | -#ifdef cl_khr_fp64 | ||
| 1755 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1756 | double __ovld lgamma_r(double x, __global int *signp); | ||
| 1757 | double2 __ovld lgamma_r(double2 x, __global int2 *signp); | ||
| 1758 | double3 __ovld lgamma_r(double3 x, __global int3 *signp); | ||
| 1759 | @@ -7710,7 +7716,7 @@ double3 __ovld lgamma_r(double3 x, __private int3 *signp); | ||
| 1760 | double4 __ovld lgamma_r(double4 x, __private int4 *signp); | ||
| 1761 | double8 __ovld lgamma_r(double8 x, __private int8 *signp); | ||
| 1762 | double16 __ovld lgamma_r(double16 x, __private int16 *signp); | ||
| 1763 | -#endif //cl_khr_fp64 | ||
| 1764 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1765 | #ifdef cl_khr_fp16 | ||
| 1766 | half __ovld lgamma_r(half x, __global int *signp); | ||
| 1767 | half2 __ovld lgamma_r(half2 x, __global int2 *signp); | ||
| 1768 | @@ -7731,8 +7737,8 @@ half4 __ovld lgamma_r(half4 x, __private int4 *signp); | ||
| 1769 | half8 __ovld lgamma_r(half8 x, __private int8 *signp); | ||
| 1770 | half16 __ovld lgamma_r(half16 x, __private int16 *signp); | ||
| 1771 | #endif //cl_khr_fp16 | ||
| 1772 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1773 | - | ||
| 1774 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 1775 | + //! CL_VERSION_2_0) | ||
| 1776 | /** | ||
| 1777 | * Compute natural logarithm. | ||
| 1778 | */ | ||
| 1779 | @@ -7742,14 +7748,14 @@ float3 __ovld __cnfn log(float3); | ||
| 1780 | float4 __ovld __cnfn log(float4); | ||
| 1781 | float8 __ovld __cnfn log(float8); | ||
| 1782 | float16 __ovld __cnfn log(float16); | ||
| 1783 | -#ifdef cl_khr_fp64 | ||
| 1784 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1785 | double __ovld __cnfn log(double); | ||
| 1786 | double2 __ovld __cnfn log(double2); | ||
| 1787 | double3 __ovld __cnfn log(double3); | ||
| 1788 | double4 __ovld __cnfn log(double4); | ||
| 1789 | double8 __ovld __cnfn log(double8); | ||
| 1790 | double16 __ovld __cnfn log(double16); | ||
| 1791 | -#endif //cl_khr_fp64 | ||
| 1792 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1793 | #ifdef cl_khr_fp16 | ||
| 1794 | half __ovld __cnfn log(half); | ||
| 1795 | half2 __ovld __cnfn log(half2); | ||
| 1796 | @@ -7760,7 +7766,7 @@ half16 __ovld __cnfn log(half16); | ||
| 1797 | #endif //cl_khr_fp16 | ||
| 1798 | |||
| 1799 | /** | ||
| 1800 | - * Compute a base 2 logarithm. | ||
| 1801 | + * Compute a base 2 logarithm | ||
| 1802 | */ | ||
| 1803 | float __ovld __cnfn log2(float); | ||
| 1804 | float2 __ovld __cnfn log2(float2); | ||
| 1805 | @@ -7768,14 +7774,14 @@ float3 __ovld __cnfn log2(float3); | ||
| 1806 | float4 __ovld __cnfn log2(float4); | ||
| 1807 | float8 __ovld __cnfn log2(float8); | ||
| 1808 | float16 __ovld __cnfn log2(float16); | ||
| 1809 | -#ifdef cl_khr_fp64 | ||
| 1810 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1811 | double __ovld __cnfn log2(double); | ||
| 1812 | double2 __ovld __cnfn log2(double2); | ||
| 1813 | double3 __ovld __cnfn log2(double3); | ||
| 1814 | double4 __ovld __cnfn log2(double4); | ||
| 1815 | double8 __ovld __cnfn log2(double8); | ||
| 1816 | double16 __ovld __cnfn log2(double16); | ||
| 1817 | -#endif //cl_khr_fp64 | ||
| 1818 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1819 | #ifdef cl_khr_fp16 | ||
| 1820 | half __ovld __cnfn log2(half); | ||
| 1821 | half2 __ovld __cnfn log2(half2); | ||
| 1822 | @@ -7794,14 +7800,14 @@ float3 __ovld __cnfn log10(float3); | ||
| 1823 | float4 __ovld __cnfn log10(float4); | ||
| 1824 | float8 __ovld __cnfn log10(float8); | ||
| 1825 | float16 __ovld __cnfn log10(float16); | ||
| 1826 | -#ifdef cl_khr_fp64 | ||
| 1827 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1828 | double __ovld __cnfn log10(double); | ||
| 1829 | double2 __ovld __cnfn log10(double2); | ||
| 1830 | double3 __ovld __cnfn log10(double3); | ||
| 1831 | double4 __ovld __cnfn log10(double4); | ||
| 1832 | double8 __ovld __cnfn log10(double8); | ||
| 1833 | double16 __ovld __cnfn log10(double16); | ||
| 1834 | -#endif //cl_khr_fp64 | ||
| 1835 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1836 | #ifdef cl_khr_fp16 | ||
| 1837 | half __ovld __cnfn log10(half); | ||
| 1838 | half2 __ovld __cnfn log10(half2); | ||
| 1839 | @@ -7820,14 +7826,14 @@ float3 __ovld __cnfn log1p(float3 x); | ||
| 1840 | float4 __ovld __cnfn log1p(float4 x); | ||
| 1841 | float8 __ovld __cnfn log1p(float8 x); | ||
| 1842 | float16 __ovld __cnfn log1p(float16 x); | ||
| 1843 | -#ifdef cl_khr_fp64 | ||
| 1844 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1845 | double __ovld __cnfn log1p(double x); | ||
| 1846 | double2 __ovld __cnfn log1p(double2 x); | ||
| 1847 | double3 __ovld __cnfn log1p(double3 x); | ||
| 1848 | double4 __ovld __cnfn log1p(double4 x); | ||
| 1849 | double8 __ovld __cnfn log1p(double8 x); | ||
| 1850 | double16 __ovld __cnfn log1p(double16 x); | ||
| 1851 | -#endif //cl_khr_fp64 | ||
| 1852 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1853 | #ifdef cl_khr_fp16 | ||
| 1854 | half __ovld __cnfn log1p(half x); | ||
| 1855 | half2 __ovld __cnfn log1p(half2 x); | ||
| 1856 | @@ -7847,14 +7853,14 @@ float3 __ovld __cnfn logb(float3 x); | ||
| 1857 | float4 __ovld __cnfn logb(float4 x); | ||
| 1858 | float8 __ovld __cnfn logb(float8 x); | ||
| 1859 | float16 __ovld __cnfn logb(float16 x); | ||
| 1860 | -#ifdef cl_khr_fp64 | ||
| 1861 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1862 | double __ovld __cnfn logb(double x); | ||
| 1863 | double2 __ovld __cnfn logb(double2 x); | ||
| 1864 | double3 __ovld __cnfn logb(double3 x); | ||
| 1865 | double4 __ovld __cnfn logb(double4 x); | ||
| 1866 | double8 __ovld __cnfn logb(double8 x); | ||
| 1867 | double16 __ovld __cnfn logb(double16 x); | ||
| 1868 | -#endif //cl_khr_fp64 | ||
| 1869 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1870 | #ifdef cl_khr_fp16 | ||
| 1871 | half __ovld __cnfn logb(half x); | ||
| 1872 | half2 __ovld __cnfn logb(half2 x); | ||
| 1873 | @@ -7877,14 +7883,14 @@ float3 __ovld __cnfn mad(float3 a, float3 b, float3 c); | ||
| 1874 | float4 __ovld __cnfn mad(float4 a, float4 b, float4 c); | ||
| 1875 | float8 __ovld __cnfn mad(float8 a, float8 b, float8 c); | ||
| 1876 | float16 __ovld __cnfn mad(float16 a, float16 b, float16 c); | ||
| 1877 | -#ifdef cl_khr_fp64 | ||
| 1878 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1879 | double __ovld __cnfn mad(double a, double b, double c); | ||
| 1880 | double2 __ovld __cnfn mad(double2 a, double2 b, double2 c); | ||
| 1881 | double3 __ovld __cnfn mad(double3 a, double3 b, double3 c); | ||
| 1882 | double4 __ovld __cnfn mad(double4 a, double4 b, double4 c); | ||
| 1883 | double8 __ovld __cnfn mad(double8 a, double8 b, double8 c); | ||
| 1884 | double16 __ovld __cnfn mad(double16 a, double16 b, double16 c); | ||
| 1885 | -#endif //cl_khr_fp64 | ||
| 1886 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1887 | #ifdef cl_khr_fp16 | ||
| 1888 | half __ovld __cnfn mad(half a, half b, half c); | ||
| 1889 | half2 __ovld __cnfn mad(half2 a, half2 b, half2 c); | ||
| 1890 | @@ -7904,14 +7910,14 @@ float3 __ovld __cnfn maxmag(float3 x, float3 y); | ||
| 1891 | float4 __ovld __cnfn maxmag(float4 x, float4 y); | ||
| 1892 | float8 __ovld __cnfn maxmag(float8 x, float8 y); | ||
| 1893 | float16 __ovld __cnfn maxmag(float16 x, float16 y); | ||
| 1894 | -#ifdef cl_khr_fp64 | ||
| 1895 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1896 | double __ovld __cnfn maxmag(double x, double y); | ||
| 1897 | double2 __ovld __cnfn maxmag(double2 x, double2 y); | ||
| 1898 | double3 __ovld __cnfn maxmag(double3 x, double3 y); | ||
| 1899 | double4 __ovld __cnfn maxmag(double4 x, double4 y); | ||
| 1900 | double8 __ovld __cnfn maxmag(double8 x, double8 y); | ||
| 1901 | double16 __ovld __cnfn maxmag(double16 x, double16 y); | ||
| 1902 | -#endif //cl_khr_fp64 | ||
| 1903 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1904 | #ifdef cl_khr_fp16 | ||
| 1905 | half __ovld __cnfn maxmag(half x, half y); | ||
| 1906 | half2 __ovld __cnfn maxmag(half2 x, half2 y); | ||
| 1907 | @@ -7931,14 +7937,14 @@ float3 __ovld __cnfn minmag(float3 x, float3 y); | ||
| 1908 | float4 __ovld __cnfn minmag(float4 x, float4 y); | ||
| 1909 | float8 __ovld __cnfn minmag(float8 x, float8 y); | ||
| 1910 | float16 __ovld __cnfn minmag(float16 x, float16 y); | ||
| 1911 | -#ifdef cl_khr_fp64 | ||
| 1912 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1913 | double __ovld __cnfn minmag(double x, double y); | ||
| 1914 | double2 __ovld __cnfn minmag(double2 x, double2 y); | ||
| 1915 | double3 __ovld __cnfn minmag(double3 x, double3 y); | ||
| 1916 | double4 __ovld __cnfn minmag(double4 x, double4 y); | ||
| 1917 | double8 __ovld __cnfn minmag(double8 x, double8 y); | ||
| 1918 | double16 __ovld __cnfn minmag(double16 x, double16 y); | ||
| 1919 | -#endif //cl_khr_fp64 | ||
| 1920 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1921 | #ifdef cl_khr_fp16 | ||
| 1922 | half __ovld __cnfn minmag(half x, half y); | ||
| 1923 | half2 __ovld __cnfn minmag(half2 x, half2 y); | ||
| 1924 | @@ -7955,21 +7961,21 @@ half16 __ovld __cnfn minmag(half16 x, half16 y); | ||
| 1925 | * the argument. It stores the integral part in the object | ||
| 1926 | * pointed to by iptr. | ||
| 1927 | */ | ||
| 1928 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1929 | +#ifdef __opencl_c_generic_address_space | ||
| 1930 | float __ovld modf(float x, float *iptr); | ||
| 1931 | float2 __ovld modf(float2 x, float2 *iptr); | ||
| 1932 | float3 __ovld modf(float3 x, float3 *iptr); | ||
| 1933 | float4 __ovld modf(float4 x, float4 *iptr); | ||
| 1934 | float8 __ovld modf(float8 x, float8 *iptr); | ||
| 1935 | float16 __ovld modf(float16 x, float16 *iptr); | ||
| 1936 | -#ifdef cl_khr_fp64 | ||
| 1937 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1938 | double __ovld modf(double x, double *iptr); | ||
| 1939 | double2 __ovld modf(double2 x, double2 *iptr); | ||
| 1940 | double3 __ovld modf(double3 x, double3 *iptr); | ||
| 1941 | double4 __ovld modf(double4 x, double4 *iptr); | ||
| 1942 | double8 __ovld modf(double8 x, double8 *iptr); | ||
| 1943 | double16 __ovld modf(double16 x, double16 *iptr); | ||
| 1944 | -#endif //cl_khr_fp64 | ||
| 1945 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1946 | #ifdef cl_khr_fp16 | ||
| 1947 | half __ovld modf(half x, half *iptr); | ||
| 1948 | half2 __ovld modf(half2 x, half2 *iptr); | ||
| 1949 | @@ -7978,7 +7984,9 @@ half4 __ovld modf(half4 x, half4 *iptr); | ||
| 1950 | half8 __ovld modf(half8 x, half8 *iptr); | ||
| 1951 | half16 __ovld modf(half16 x, half16 *iptr); | ||
| 1952 | #endif //cl_khr_fp16 | ||
| 1953 | -#else | ||
| 1954 | +#endif //__opencl_c_generic_address_space | ||
| 1955 | + | ||
| 1956 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 1957 | float __ovld modf(float x, __global float *iptr); | ||
| 1958 | float2 __ovld modf(float2 x, __global float2 *iptr); | ||
| 1959 | float3 __ovld modf(float3 x, __global float3 *iptr); | ||
| 1960 | @@ -7997,7 +8005,7 @@ float3 __ovld modf(float3 x, __private float3 *iptr); | ||
| 1961 | float4 __ovld modf(float4 x, __private float4 *iptr); | ||
| 1962 | float8 __ovld modf(float8 x, __private float8 *iptr); | ||
| 1963 | float16 __ovld modf(float16 x, __private float16 *iptr); | ||
| 1964 | -#ifdef cl_khr_fp64 | ||
| 1965 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1966 | double __ovld modf(double x, __global double *iptr); | ||
| 1967 | double2 __ovld modf(double2 x, __global double2 *iptr); | ||
| 1968 | double3 __ovld modf(double3 x, __global double3 *iptr); | ||
| 1969 | @@ -8016,7 +8024,7 @@ double3 __ovld modf(double3 x, __private double3 *iptr); | ||
| 1970 | double4 __ovld modf(double4 x, __private double4 *iptr); | ||
| 1971 | double8 __ovld modf(double8 x, __private double8 *iptr); | ||
| 1972 | double16 __ovld modf(double16 x, __private double16 *iptr); | ||
| 1973 | -#endif //cl_khr_fp64 | ||
| 1974 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1975 | #ifdef cl_khr_fp16 | ||
| 1976 | half __ovld modf(half x, __global half *iptr); | ||
| 1977 | half2 __ovld modf(half2 x, __global half2 *iptr); | ||
| 1978 | @@ -8037,7 +8045,8 @@ half4 __ovld modf(half4 x, __private half4 *iptr); | ||
| 1979 | half8 __ovld modf(half8 x, __private half8 *iptr); | ||
| 1980 | half16 __ovld modf(half16 x, __private half16 *iptr); | ||
| 1981 | #endif //cl_khr_fp16 | ||
| 1982 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1983 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 1984 | + //! CL_VERSION_2_0) | ||
| 1985 | |||
| 1986 | /** | ||
| 1987 | * Returns a quiet NaN. The nancode may be placed | ||
| 1988 | @@ -8049,14 +8058,14 @@ float3 __ovld __cnfn nan(uint3 nancode); | ||
| 1989 | float4 __ovld __cnfn nan(uint4 nancode); | ||
| 1990 | float8 __ovld __cnfn nan(uint8 nancode); | ||
| 1991 | float16 __ovld __cnfn nan(uint16 nancode); | ||
| 1992 | -#ifdef cl_khr_fp64 | ||
| 1993 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1994 | double __ovld __cnfn nan(ulong nancode); | ||
| 1995 | double2 __ovld __cnfn nan(ulong2 nancode); | ||
| 1996 | double3 __ovld __cnfn nan(ulong3 nancode); | ||
| 1997 | double4 __ovld __cnfn nan(ulong4 nancode); | ||
| 1998 | double8 __ovld __cnfn nan(ulong8 nancode); | ||
| 1999 | double16 __ovld __cnfn nan(ulong16 nancode); | ||
| 2000 | -#endif //cl_khr_fp64 | ||
| 2001 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2002 | #ifdef cl_khr_fp16 | ||
| 2003 | half __ovld __cnfn nan(ushort nancode); | ||
| 2004 | half2 __ovld __cnfn nan(ushort2 nancode); | ||
| 2005 | @@ -8079,14 +8088,14 @@ float3 __ovld __cnfn nextafter(float3 x, float3 y); | ||
| 2006 | float4 __ovld __cnfn nextafter(float4 x, float4 y); | ||
| 2007 | float8 __ovld __cnfn nextafter(float8 x, float8 y); | ||
| 2008 | float16 __ovld __cnfn nextafter(float16 x, float16 y); | ||
| 2009 | -#ifdef cl_khr_fp64 | ||
| 2010 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2011 | double __ovld __cnfn nextafter(double x, double y); | ||
| 2012 | double2 __ovld __cnfn nextafter(double2 x, double2 y); | ||
| 2013 | double3 __ovld __cnfn nextafter(double3 x, double3 y); | ||
| 2014 | double4 __ovld __cnfn nextafter(double4 x, double4 y); | ||
| 2015 | double8 __ovld __cnfn nextafter(double8 x, double8 y); | ||
| 2016 | double16 __ovld __cnfn nextafter(double16 x, double16 y); | ||
| 2017 | -#endif //cl_khr_fp64 | ||
| 2018 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2019 | #ifdef cl_khr_fp16 | ||
| 2020 | half __ovld __cnfn nextafter(half x, half y); | ||
| 2021 | half2 __ovld __cnfn nextafter(half2 x, half2 y); | ||
| 2022 | @@ -8105,14 +8114,14 @@ float3 __ovld __cnfn pow(float3 x, float3 y); | ||
| 2023 | float4 __ovld __cnfn pow(float4 x, float4 y); | ||
| 2024 | float8 __ovld __cnfn pow(float8 x, float8 y); | ||
| 2025 | float16 __ovld __cnfn pow(float16 x, float16 y); | ||
| 2026 | -#ifdef cl_khr_fp64 | ||
| 2027 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2028 | double __ovld __cnfn pow(double x, double y); | ||
| 2029 | double2 __ovld __cnfn pow(double2 x, double2 y); | ||
| 2030 | double3 __ovld __cnfn pow(double3 x, double3 y); | ||
| 2031 | double4 __ovld __cnfn pow(double4 x, double4 y); | ||
| 2032 | double8 __ovld __cnfn pow(double8 x, double8 y); | ||
| 2033 | double16 __ovld __cnfn pow(double16 x, double16 y); | ||
| 2034 | -#endif //cl_khr_fp64 | ||
| 2035 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2036 | #ifdef cl_khr_fp16 | ||
| 2037 | half __ovld __cnfn pow(half x, half y); | ||
| 2038 | half2 __ovld __cnfn pow(half2 x, half2 y); | ||
| 2039 | @@ -8131,14 +8140,14 @@ float3 __ovld __cnfn pown(float3 x, int3 y); | ||
| 2040 | float4 __ovld __cnfn pown(float4 x, int4 y); | ||
| 2041 | float8 __ovld __cnfn pown(float8 x, int8 y); | ||
| 2042 | float16 __ovld __cnfn pown(float16 x, int16 y); | ||
| 2043 | -#ifdef cl_khr_fp64 | ||
| 2044 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2045 | double __ovld __cnfn pown(double x, int y); | ||
| 2046 | double2 __ovld __cnfn pown(double2 x, int2 y); | ||
| 2047 | double3 __ovld __cnfn pown(double3 x, int3 y); | ||
| 2048 | double4 __ovld __cnfn pown(double4 x, int4 y); | ||
| 2049 | double8 __ovld __cnfn pown(double8 x, int8 y); | ||
| 2050 | double16 __ovld __cnfn pown(double16 x, int16 y); | ||
| 2051 | -#endif //cl_khr_fp64 | ||
| 2052 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2053 | #ifdef cl_khr_fp16 | ||
| 2054 | half __ovld __cnfn pown(half x, int y); | ||
| 2055 | half2 __ovld __cnfn pown(half2 x, int2 y); | ||
| 2056 | @@ -8157,14 +8166,14 @@ float3 __ovld __cnfn powr(float3 x, float3 y); | ||
| 2057 | float4 __ovld __cnfn powr(float4 x, float4 y); | ||
| 2058 | float8 __ovld __cnfn powr(float8 x, float8 y); | ||
| 2059 | float16 __ovld __cnfn powr(float16 x, float16 y); | ||
| 2060 | -#ifdef cl_khr_fp64 | ||
| 2061 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2062 | double __ovld __cnfn powr(double x, double y); | ||
| 2063 | double2 __ovld __cnfn powr(double2 x, double2 y); | ||
| 2064 | double3 __ovld __cnfn powr(double3 x, double3 y); | ||
| 2065 | double4 __ovld __cnfn powr(double4 x, double4 y); | ||
| 2066 | double8 __ovld __cnfn powr(double8 x, double8 y); | ||
| 2067 | double16 __ovld __cnfn powr(double16 x, double16 y); | ||
| 2068 | -#endif //cl_khr_fp64 | ||
| 2069 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2070 | #ifdef cl_khr_fp16 | ||
| 2071 | half __ovld __cnfn powr(half x, half y); | ||
| 2072 | half2 __ovld __cnfn powr(half2 x, half2 y); | ||
| 2073 | @@ -8186,14 +8195,14 @@ float3 __ovld __cnfn remainder(float3 x, float3 y); | ||
| 2074 | float4 __ovld __cnfn remainder(float4 x, float4 y); | ||
| 2075 | float8 __ovld __cnfn remainder(float8 x, float8 y); | ||
| 2076 | float16 __ovld __cnfn remainder(float16 x, float16 y); | ||
| 2077 | -#ifdef cl_khr_fp64 | ||
| 2078 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2079 | double __ovld __cnfn remainder(double x, double y); | ||
| 2080 | double2 __ovld __cnfn remainder(double2 x, double2 y); | ||
| 2081 | double3 __ovld __cnfn remainder(double3 x, double3 y); | ||
| 2082 | double4 __ovld __cnfn remainder(double4 x, double4 y); | ||
| 2083 | double8 __ovld __cnfn remainder(double8 x, double8 y); | ||
| 2084 | double16 __ovld __cnfn remainder(double16 x, double16 y); | ||
| 2085 | -#endif //cl_khr_fp64 | ||
| 2086 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2087 | #ifdef cl_khr_fp16 | ||
| 2088 | half __ovld __cnfn remainder(half x, half y); | ||
| 2089 | half2 __ovld __cnfn remainder(half2 x, half2 y); | ||
| 2090 | @@ -8215,21 +8224,21 @@ half16 __ovld __cnfn remainder(half16 x, half16 y); | ||
| 2091 | * sign as x/y. It stores this signed value in the object | ||
| 2092 | * pointed to by quo. | ||
| 2093 | */ | ||
| 2094 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2095 | +#ifdef __opencl_c_generic_address_space | ||
| 2096 | float __ovld remquo(float x, float y, int *quo); | ||
| 2097 | float2 __ovld remquo(float2 x, float2 y, int2 *quo); | ||
| 2098 | float3 __ovld remquo(float3 x, float3 y, int3 *quo); | ||
| 2099 | float4 __ovld remquo(float4 x, float4 y, int4 *quo); | ||
| 2100 | float8 __ovld remquo(float8 x, float8 y, int8 *quo); | ||
| 2101 | float16 __ovld remquo(float16 x, float16 y, int16 *quo); | ||
| 2102 | -#ifdef cl_khr_fp64 | ||
| 2103 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2104 | double __ovld remquo(double x, double y, int *quo); | ||
| 2105 | double2 __ovld remquo(double2 x, double2 y, int2 *quo); | ||
| 2106 | double3 __ovld remquo(double3 x, double3 y, int3 *quo); | ||
| 2107 | double4 __ovld remquo(double4 x, double4 y, int4 *quo); | ||
| 2108 | double8 __ovld remquo(double8 x, double8 y, int8 *quo); | ||
| 2109 | double16 __ovld remquo(double16 x, double16 y, int16 *quo); | ||
| 2110 | -#endif //cl_khr_fp64 | ||
| 2111 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2112 | #ifdef cl_khr_fp16 | ||
| 2113 | half __ovld remquo(half x, half y, int *quo); | ||
| 2114 | half2 __ovld remquo(half2 x, half2 y, int2 *quo); | ||
| 2115 | @@ -8237,9 +8246,10 @@ half3 __ovld remquo(half3 x, half3 y, int3 *quo); | ||
| 2116 | half4 __ovld remquo(half4 x, half4 y, int4 *quo); | ||
| 2117 | half8 __ovld remquo(half8 x, half8 y, int8 *quo); | ||
| 2118 | half16 __ovld remquo(half16 x, half16 y, int16 *quo); | ||
| 2119 | - | ||
| 2120 | #endif //cl_khr_fp16 | ||
| 2121 | -#else | ||
| 2122 | +#endif //__opencl_c_generic_address_space | ||
| 2123 | + | ||
| 2124 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 2125 | float __ovld remquo(float x, float y, __global int *quo); | ||
| 2126 | float2 __ovld remquo(float2 x, float2 y, __global int2 *quo); | ||
| 2127 | float3 __ovld remquo(float3 x, float3 y, __global int3 *quo); | ||
| 2128 | @@ -8258,7 +8268,7 @@ float3 __ovld remquo(float3 x, float3 y, __private int3 *quo); | ||
| 2129 | float4 __ovld remquo(float4 x, float4 y, __private int4 *quo); | ||
| 2130 | float8 __ovld remquo(float8 x, float8 y, __private int8 *quo); | ||
| 2131 | float16 __ovld remquo(float16 x, float16 y, __private int16 *quo); | ||
| 2132 | -#ifdef cl_khr_fp64 | ||
| 2133 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2134 | double __ovld remquo(double x, double y, __global int *quo); | ||
| 2135 | double2 __ovld remquo(double2 x, double2 y, __global int2 *quo); | ||
| 2136 | double3 __ovld remquo(double3 x, double3 y, __global int3 *quo); | ||
| 2137 | @@ -8277,7 +8287,7 @@ double3 __ovld remquo(double3 x, double3 y, __private int3 *quo); | ||
| 2138 | double4 __ovld remquo(double4 x, double4 y, __private int4 *quo); | ||
| 2139 | double8 __ovld remquo(double8 x, double8 y, __private int8 *quo); | ||
| 2140 | double16 __ovld remquo(double16 x, double16 y, __private int16 *quo); | ||
| 2141 | -#endif //cl_khr_fp64 | ||
| 2142 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2143 | #ifdef cl_khr_fp16 | ||
| 2144 | half __ovld remquo(half x, half y, __global int *quo); | ||
| 2145 | half2 __ovld remquo(half2 x, half2 y, __global int2 *quo); | ||
| 2146 | @@ -8298,7 +8308,8 @@ half4 __ovld remquo(half4 x, half4 y, __private int4 *quo); | ||
| 2147 | half8 __ovld remquo(half8 x, half8 y, __private int8 *quo); | ||
| 2148 | half16 __ovld remquo(half16 x, half16 y, __private int16 *quo); | ||
| 2149 | #endif //cl_khr_fp16 | ||
| 2150 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2151 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 2152 | + //! CL_VERSION_2_0) | ||
| 2153 | /** | ||
| 2154 | * Round to integral value (using round to nearest | ||
| 2155 | * even rounding mode) in floating-point format. | ||
| 2156 | @@ -8311,14 +8322,14 @@ float3 __ovld __cnfn rint(float3); | ||
| 2157 | float4 __ovld __cnfn rint(float4); | ||
| 2158 | float8 __ovld __cnfn rint(float8); | ||
| 2159 | float16 __ovld __cnfn rint(float16); | ||
| 2160 | -#ifdef cl_khr_fp64 | ||
| 2161 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2162 | double __ovld __cnfn rint(double); | ||
| 2163 | double2 __ovld __cnfn rint(double2); | ||
| 2164 | double3 __ovld __cnfn rint(double3); | ||
| 2165 | double4 __ovld __cnfn rint(double4); | ||
| 2166 | double8 __ovld __cnfn rint(double8); | ||
| 2167 | double16 __ovld __cnfn rint(double16); | ||
| 2168 | -#endif //cl_khr_fp64 | ||
| 2169 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2170 | #ifdef cl_khr_fp16 | ||
| 2171 | half __ovld __cnfn rint(half); | ||
| 2172 | half2 __ovld __cnfn rint(half2); | ||
| 2173 | @@ -8337,14 +8348,14 @@ float3 __ovld __cnfn rootn(float3 x, int3 y); | ||
| 2174 | float4 __ovld __cnfn rootn(float4 x, int4 y); | ||
| 2175 | float8 __ovld __cnfn rootn(float8 x, int8 y); | ||
| 2176 | float16 __ovld __cnfn rootn(float16 x, int16 y); | ||
| 2177 | -#ifdef cl_khr_fp64 | ||
| 2178 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2179 | double __ovld __cnfn rootn(double x, int y); | ||
| 2180 | double2 __ovld __cnfn rootn(double2 x, int2 y); | ||
| 2181 | double3 __ovld __cnfn rootn(double3 x, int3 y); | ||
| 2182 | double4 __ovld __cnfn rootn(double4 x, int4 y); | ||
| 2183 | double8 __ovld __cnfn rootn(double8 x, int8 y); | ||
| 2184 | double16 __ovld __cnfn rootn(double16 x, int16 y); | ||
| 2185 | -#endif //cl_khr_fp64 | ||
| 2186 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2187 | #ifdef cl_khr_fp16 | ||
| 2188 | half __ovld __cnfn rootn(half x, int y); | ||
| 2189 | half2 __ovld __cnfn rootn(half2 x, int2 y); | ||
| 2190 | @@ -8365,14 +8376,14 @@ float3 __ovld __cnfn round(float3 x); | ||
| 2191 | float4 __ovld __cnfn round(float4 x); | ||
| 2192 | float8 __ovld __cnfn round(float8 x); | ||
| 2193 | float16 __ovld __cnfn round(float16 x); | ||
| 2194 | -#ifdef cl_khr_fp64 | ||
| 2195 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2196 | double __ovld __cnfn round(double x); | ||
| 2197 | double2 __ovld __cnfn round(double2 x); | ||
| 2198 | double3 __ovld __cnfn round(double3 x); | ||
| 2199 | double4 __ovld __cnfn round(double4 x); | ||
| 2200 | double8 __ovld __cnfn round(double8 x); | ||
| 2201 | double16 __ovld __cnfn round(double16 x); | ||
| 2202 | -#endif //cl_khr_fp64 | ||
| 2203 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2204 | #ifdef cl_khr_fp16 | ||
| 2205 | half __ovld __cnfn round(half x); | ||
| 2206 | half2 __ovld __cnfn round(half2 x); | ||
| 2207 | @@ -8391,14 +8402,14 @@ float3 __ovld __cnfn rsqrt(float3); | ||
| 2208 | float4 __ovld __cnfn rsqrt(float4); | ||
| 2209 | float8 __ovld __cnfn rsqrt(float8); | ||
| 2210 | float16 __ovld __cnfn rsqrt(float16); | ||
| 2211 | -#ifdef cl_khr_fp64 | ||
| 2212 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2213 | double __ovld __cnfn rsqrt(double); | ||
| 2214 | double2 __ovld __cnfn rsqrt(double2); | ||
| 2215 | double3 __ovld __cnfn rsqrt(double3); | ||
| 2216 | double4 __ovld __cnfn rsqrt(double4); | ||
| 2217 | double8 __ovld __cnfn rsqrt(double8); | ||
| 2218 | double16 __ovld __cnfn rsqrt(double16); | ||
| 2219 | -#endif //cl_khr_fp64 | ||
| 2220 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2221 | #ifdef cl_khr_fp16 | ||
| 2222 | half __ovld __cnfn rsqrt(half); | ||
| 2223 | half2 __ovld __cnfn rsqrt(half2); | ||
| 2224 | @@ -8417,14 +8428,14 @@ float3 __ovld __cnfn sin(float3); | ||
| 2225 | float4 __ovld __cnfn sin(float4); | ||
| 2226 | float8 __ovld __cnfn sin(float8); | ||
| 2227 | float16 __ovld __cnfn sin(float16); | ||
| 2228 | -#ifdef cl_khr_fp64 | ||
| 2229 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2230 | double __ovld __cnfn sin(double); | ||
| 2231 | double2 __ovld __cnfn sin(double2); | ||
| 2232 | double3 __ovld __cnfn sin(double3); | ||
| 2233 | double4 __ovld __cnfn sin(double4); | ||
| 2234 | double8 __ovld __cnfn sin(double8); | ||
| 2235 | double16 __ovld __cnfn sin(double16); | ||
| 2236 | -#endif //cl_khr_fp64 | ||
| 2237 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2238 | #ifdef cl_khr_fp16 | ||
| 2239 | half __ovld __cnfn sin(half); | ||
| 2240 | half2 __ovld __cnfn sin(half2); | ||
| 2241 | @@ -8439,21 +8450,21 @@ half16 __ovld __cnfn sin(half16); | ||
| 2242 | * is the return value and computed cosine is returned | ||
| 2243 | * in cosval. | ||
| 2244 | */ | ||
| 2245 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2246 | +#ifdef __opencl_c_generic_address_space | ||
| 2247 | float __ovld sincos(float x, float *cosval); | ||
| 2248 | float2 __ovld sincos(float2 x, float2 *cosval); | ||
| 2249 | float3 __ovld sincos(float3 x, float3 *cosval); | ||
| 2250 | float4 __ovld sincos(float4 x, float4 *cosval); | ||
| 2251 | float8 __ovld sincos(float8 x, float8 *cosval); | ||
| 2252 | float16 __ovld sincos(float16 x, float16 *cosval); | ||
| 2253 | -#ifdef cl_khr_fp64 | ||
| 2254 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2255 | double __ovld sincos(double x, double *cosval); | ||
| 2256 | double2 __ovld sincos(double2 x, double2 *cosval); | ||
| 2257 | double3 __ovld sincos(double3 x, double3 *cosval); | ||
| 2258 | double4 __ovld sincos(double4 x, double4 *cosval); | ||
| 2259 | double8 __ovld sincos(double8 x, double8 *cosval); | ||
| 2260 | double16 __ovld sincos(double16 x, double16 *cosval); | ||
| 2261 | -#endif //cl_khr_fp64 | ||
| 2262 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2263 | #ifdef cl_khr_fp16 | ||
| 2264 | half __ovld sincos(half x, half *cosval); | ||
| 2265 | half2 __ovld sincos(half2 x, half2 *cosval); | ||
| 2266 | @@ -8462,7 +8473,9 @@ half4 __ovld sincos(half4 x, half4 *cosval); | ||
| 2267 | half8 __ovld sincos(half8 x, half8 *cosval); | ||
| 2268 | half16 __ovld sincos(half16 x, half16 *cosval); | ||
| 2269 | #endif //cl_khr_fp16 | ||
| 2270 | -#else | ||
| 2271 | +#endif //__opencl_c_generic_address_space | ||
| 2272 | + | ||
| 2273 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 2274 | float __ovld sincos(float x, __global float *cosval); | ||
| 2275 | float2 __ovld sincos(float2 x, __global float2 *cosval); | ||
| 2276 | float3 __ovld sincos(float3 x, __global float3 *cosval); | ||
| 2277 | @@ -8481,7 +8494,7 @@ float3 __ovld sincos(float3 x, __private float3 *cosval); | ||
| 2278 | float4 __ovld sincos(float4 x, __private float4 *cosval); | ||
| 2279 | float8 __ovld sincos(float8 x, __private float8 *cosval); | ||
| 2280 | float16 __ovld sincos(float16 x, __private float16 *cosval); | ||
| 2281 | -#ifdef cl_khr_fp64 | ||
| 2282 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2283 | double __ovld sincos(double x, __global double *cosval); | ||
| 2284 | double2 __ovld sincos(double2 x, __global double2 *cosval); | ||
| 2285 | double3 __ovld sincos(double3 x, __global double3 *cosval); | ||
| 2286 | @@ -8500,7 +8513,7 @@ double3 __ovld sincos(double3 x, __private double3 *cosval); | ||
| 2287 | double4 __ovld sincos(double4 x, __private double4 *cosval); | ||
| 2288 | double8 __ovld sincos(double8 x, __private double8 *cosval); | ||
| 2289 | double16 __ovld sincos(double16 x, __private double16 *cosval); | ||
| 2290 | -#endif //cl_khr_fp64 | ||
| 2291 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2292 | #ifdef cl_khr_fp16 | ||
| 2293 | half __ovld sincos(half x, __global half *cosval); | ||
| 2294 | half2 __ovld sincos(half2 x, __global half2 *cosval); | ||
| 2295 | @@ -8521,8 +8534,8 @@ half4 __ovld sincos(half4 x, __private half4 *cosval); | ||
| 2296 | half8 __ovld sincos(half8 x, __private half8 *cosval); | ||
| 2297 | half16 __ovld sincos(half16 x, __private half16 *cosval); | ||
| 2298 | #endif //cl_khr_fp16 | ||
| 2299 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2300 | - | ||
| 2301 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 2302 | + //! CL_VERSION_2_0) | ||
| 2303 | /** | ||
| 2304 | * Compute hyperbolic sine. | ||
| 2305 | */ | ||
| 2306 | @@ -8532,14 +8545,14 @@ float3 __ovld __cnfn sinh(float3); | ||
| 2307 | float4 __ovld __cnfn sinh(float4); | ||
| 2308 | float8 __ovld __cnfn sinh(float8); | ||
| 2309 | float16 __ovld __cnfn sinh(float16); | ||
| 2310 | -#ifdef cl_khr_fp64 | ||
| 2311 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2312 | double __ovld __cnfn sinh(double); | ||
| 2313 | double2 __ovld __cnfn sinh(double2); | ||
| 2314 | double3 __ovld __cnfn sinh(double3); | ||
| 2315 | double4 __ovld __cnfn sinh(double4); | ||
| 2316 | double8 __ovld __cnfn sinh(double8); | ||
| 2317 | double16 __ovld __cnfn sinh(double16); | ||
| 2318 | -#endif //cl_khr_fp64 | ||
| 2319 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2320 | #ifdef cl_khr_fp16 | ||
| 2321 | half __ovld __cnfn sinh(half); | ||
| 2322 | half2 __ovld __cnfn sinh(half2); | ||
| 2323 | @@ -8558,14 +8571,14 @@ float3 __ovld __cnfn sinpi(float3 x); | ||
| 2324 | float4 __ovld __cnfn sinpi(float4 x); | ||
| 2325 | float8 __ovld __cnfn sinpi(float8 x); | ||
| 2326 | float16 __ovld __cnfn sinpi(float16 x); | ||
| 2327 | -#ifdef cl_khr_fp64 | ||
| 2328 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2329 | double __ovld __cnfn sinpi(double x); | ||
| 2330 | double2 __ovld __cnfn sinpi(double2 x); | ||
| 2331 | double3 __ovld __cnfn sinpi(double3 x); | ||
| 2332 | double4 __ovld __cnfn sinpi(double4 x); | ||
| 2333 | double8 __ovld __cnfn sinpi(double8 x); | ||
| 2334 | double16 __ovld __cnfn sinpi(double16 x); | ||
| 2335 | -#endif //cl_khr_fp64 | ||
| 2336 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2337 | #ifdef cl_khr_fp16 | ||
| 2338 | half __ovld __cnfn sinpi(half x); | ||
| 2339 | half2 __ovld __cnfn sinpi(half2 x); | ||
| 2340 | @@ -8584,14 +8597,14 @@ float3 __ovld __cnfn sqrt(float3); | ||
| 2341 | float4 __ovld __cnfn sqrt(float4); | ||
| 2342 | float8 __ovld __cnfn sqrt(float8); | ||
| 2343 | float16 __ovld __cnfn sqrt(float16); | ||
| 2344 | -#ifdef cl_khr_fp64 | ||
| 2345 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2346 | double __ovld __cnfn sqrt(double); | ||
| 2347 | double2 __ovld __cnfn sqrt(double2); | ||
| 2348 | double3 __ovld __cnfn sqrt(double3); | ||
| 2349 | double4 __ovld __cnfn sqrt(double4); | ||
| 2350 | double8 __ovld __cnfn sqrt(double8); | ||
| 2351 | double16 __ovld __cnfn sqrt(double16); | ||
| 2352 | -#endif //cl_khr_fp64 | ||
| 2353 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2354 | #ifdef cl_khr_fp16 | ||
| 2355 | half __ovld __cnfn sqrt(half); | ||
| 2356 | half2 __ovld __cnfn sqrt(half2); | ||
| 2357 | @@ -8610,14 +8623,14 @@ float3 __ovld __cnfn tan(float3); | ||
| 2358 | float4 __ovld __cnfn tan(float4); | ||
| 2359 | float8 __ovld __cnfn tan(float8); | ||
| 2360 | float16 __ovld __cnfn tan(float16); | ||
| 2361 | -#ifdef cl_khr_fp64 | ||
| 2362 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2363 | double __ovld __cnfn tan(double); | ||
| 2364 | double2 __ovld __cnfn tan(double2); | ||
| 2365 | double3 __ovld __cnfn tan(double3); | ||
| 2366 | double4 __ovld __cnfn tan(double4); | ||
| 2367 | double8 __ovld __cnfn tan(double8); | ||
| 2368 | double16 __ovld __cnfn tan(double16); | ||
| 2369 | -#endif //cl_khr_fp64 | ||
| 2370 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2371 | #ifdef cl_khr_fp16 | ||
| 2372 | half __ovld __cnfn tan(half); | ||
| 2373 | half2 __ovld __cnfn tan(half2); | ||
| 2374 | @@ -8636,14 +8649,14 @@ float3 __ovld __cnfn tanh(float3); | ||
| 2375 | float4 __ovld __cnfn tanh(float4); | ||
| 2376 | float8 __ovld __cnfn tanh(float8); | ||
| 2377 | float16 __ovld __cnfn tanh(float16); | ||
| 2378 | -#ifdef cl_khr_fp64 | ||
| 2379 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2380 | double __ovld __cnfn tanh(double); | ||
| 2381 | double2 __ovld __cnfn tanh(double2); | ||
| 2382 | double3 __ovld __cnfn tanh(double3); | ||
| 2383 | double4 __ovld __cnfn tanh(double4); | ||
| 2384 | double8 __ovld __cnfn tanh(double8); | ||
| 2385 | double16 __ovld __cnfn tanh(double16); | ||
| 2386 | -#endif //cl_khr_fp64 | ||
| 2387 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2388 | #ifdef cl_khr_fp16 | ||
| 2389 | half __ovld __cnfn tanh(half); | ||
| 2390 | half2 __ovld __cnfn tanh(half2); | ||
| 2391 | @@ -8662,14 +8675,14 @@ float3 __ovld __cnfn tanpi(float3 x); | ||
| 2392 | float4 __ovld __cnfn tanpi(float4 x); | ||
| 2393 | float8 __ovld __cnfn tanpi(float8 x); | ||
| 2394 | float16 __ovld __cnfn tanpi(float16 x); | ||
| 2395 | -#ifdef cl_khr_fp64 | ||
| 2396 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2397 | double __ovld __cnfn tanpi(double x); | ||
| 2398 | double2 __ovld __cnfn tanpi(double2 x); | ||
| 2399 | double3 __ovld __cnfn tanpi(double3 x); | ||
| 2400 | double4 __ovld __cnfn tanpi(double4 x); | ||
| 2401 | double8 __ovld __cnfn tanpi(double8 x); | ||
| 2402 | double16 __ovld __cnfn tanpi(double16 x); | ||
| 2403 | -#endif //cl_khr_fp64 | ||
| 2404 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2405 | #ifdef cl_khr_fp16 | ||
| 2406 | half __ovld __cnfn tanpi(half x); | ||
| 2407 | half2 __ovld __cnfn tanpi(half2 x); | ||
| 2408 | @@ -8688,14 +8701,14 @@ float3 __ovld __cnfn tgamma(float3); | ||
| 2409 | float4 __ovld __cnfn tgamma(float4); | ||
| 2410 | float8 __ovld __cnfn tgamma(float8); | ||
| 2411 | float16 __ovld __cnfn tgamma(float16); | ||
| 2412 | -#ifdef cl_khr_fp64 | ||
| 2413 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2414 | double __ovld __cnfn tgamma(double); | ||
| 2415 | double2 __ovld __cnfn tgamma(double2); | ||
| 2416 | double3 __ovld __cnfn tgamma(double3); | ||
| 2417 | double4 __ovld __cnfn tgamma(double4); | ||
| 2418 | double8 __ovld __cnfn tgamma(double8); | ||
| 2419 | double16 __ovld __cnfn tgamma(double16); | ||
| 2420 | -#endif //cl_khr_fp64 | ||
| 2421 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2422 | #ifdef cl_khr_fp16 | ||
| 2423 | half __ovld __cnfn tgamma(half); | ||
| 2424 | half2 __ovld __cnfn tgamma(half2); | ||
| 2425 | @@ -8715,14 +8728,14 @@ float3 __ovld __cnfn trunc(float3); | ||
| 2426 | float4 __ovld __cnfn trunc(float4); | ||
| 2427 | float8 __ovld __cnfn trunc(float8); | ||
| 2428 | float16 __ovld __cnfn trunc(float16); | ||
| 2429 | -#ifdef cl_khr_fp64 | ||
| 2430 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2431 | double __ovld __cnfn trunc(double); | ||
| 2432 | double2 __ovld __cnfn trunc(double2); | ||
| 2433 | double3 __ovld __cnfn trunc(double3); | ||
| 2434 | double4 __ovld __cnfn trunc(double4); | ||
| 2435 | double8 __ovld __cnfn trunc(double8); | ||
| 2436 | double16 __ovld __cnfn trunc(double16); | ||
| 2437 | -#endif //cl_khr_fp64 | ||
| 2438 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2439 | #ifdef cl_khr_fp16 | ||
| 2440 | half __ovld __cnfn trunc(half); | ||
| 2441 | half2 __ovld __cnfn trunc(half2); | ||
| 2442 | @@ -10108,7 +10121,7 @@ float3 __ovld __cnfn clamp(float3 x, float minval, float maxval); | ||
| 2443 | float4 __ovld __cnfn clamp(float4 x, float minval, float maxval); | ||
| 2444 | float8 __ovld __cnfn clamp(float8 x, float minval, float maxval); | ||
| 2445 | float16 __ovld __cnfn clamp(float16 x, float minval, float maxval); | ||
| 2446 | -#ifdef cl_khr_fp64 | ||
| 2447 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2448 | double __ovld __cnfn clamp(double x, double minval, double maxval); | ||
| 2449 | double2 __ovld __cnfn clamp(double2 x, double2 minval, double2 maxval); | ||
| 2450 | double3 __ovld __cnfn clamp(double3 x, double3 minval, double3 maxval); | ||
| 2451 | @@ -10120,7 +10133,7 @@ double3 __ovld __cnfn clamp(double3 x, double minval, double maxval); | ||
| 2452 | double4 __ovld __cnfn clamp(double4 x, double minval, double maxval); | ||
| 2453 | double8 __ovld __cnfn clamp(double8 x, double minval, double maxval); | ||
| 2454 | double16 __ovld __cnfn clamp(double16 x, double minval, double maxval); | ||
| 2455 | -#endif //cl_khr_fp64 | ||
| 2456 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2457 | #ifdef cl_khr_fp16 | ||
| 2458 | half __ovld __cnfn clamp(half x, half minval, half maxval); | ||
| 2459 | half2 __ovld __cnfn clamp(half2 x, half2 minval, half2 maxval); | ||
| 2460 | @@ -10145,14 +10158,14 @@ float3 __ovld __cnfn degrees(float3 radians); | ||
| 2461 | float4 __ovld __cnfn degrees(float4 radians); | ||
| 2462 | float8 __ovld __cnfn degrees(float8 radians); | ||
| 2463 | float16 __ovld __cnfn degrees(float16 radians); | ||
| 2464 | -#ifdef cl_khr_fp64 | ||
| 2465 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2466 | double __ovld __cnfn degrees(double radians); | ||
| 2467 | double2 __ovld __cnfn degrees(double2 radians); | ||
| 2468 | double3 __ovld __cnfn degrees(double3 radians); | ||
| 2469 | double4 __ovld __cnfn degrees(double4 radians); | ||
| 2470 | double8 __ovld __cnfn degrees(double8 radians); | ||
| 2471 | double16 __ovld __cnfn degrees(double16 radians); | ||
| 2472 | -#endif //cl_khr_fp64 | ||
| 2473 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2474 | #ifdef cl_khr_fp16 | ||
| 2475 | half __ovld __cnfn degrees(half radians); | ||
| 2476 | half2 __ovld __cnfn degrees(half2 radians); | ||
| 2477 | @@ -10177,7 +10190,7 @@ float3 __ovld __cnfn max(float3 x, float y); | ||
| 2478 | float4 __ovld __cnfn max(float4 x, float y); | ||
| 2479 | float8 __ovld __cnfn max(float8 x, float y); | ||
| 2480 | float16 __ovld __cnfn max(float16 x, float y); | ||
| 2481 | -#ifdef cl_khr_fp64 | ||
| 2482 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2483 | double __ovld __cnfn max(double x, double y); | ||
| 2484 | double2 __ovld __cnfn max(double2 x, double2 y); | ||
| 2485 | double3 __ovld __cnfn max(double3 x, double3 y); | ||
| 2486 | @@ -10189,7 +10202,7 @@ double3 __ovld __cnfn max(double3 x, double y); | ||
| 2487 | double4 __ovld __cnfn max(double4 x, double y); | ||
| 2488 | double8 __ovld __cnfn max(double8 x, double y); | ||
| 2489 | double16 __ovld __cnfn max(double16 x, double y); | ||
| 2490 | -#endif //cl_khr_fp64 | ||
| 2491 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2492 | #ifdef cl_khr_fp16 | ||
| 2493 | half __ovld __cnfn max(half x, half y); | ||
| 2494 | half2 __ovld __cnfn max(half2 x, half2 y); | ||
| 2495 | @@ -10219,7 +10232,7 @@ float3 __ovld __cnfn min(float3 x, float y); | ||
| 2496 | float4 __ovld __cnfn min(float4 x, float y); | ||
| 2497 | float8 __ovld __cnfn min(float8 x, float y); | ||
| 2498 | float16 __ovld __cnfn min(float16 x, float y); | ||
| 2499 | -#ifdef cl_khr_fp64 | ||
| 2500 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2501 | double __ovld __cnfn min(double x, double y); | ||
| 2502 | double2 __ovld __cnfn min(double2 x, double2 y); | ||
| 2503 | double3 __ovld __cnfn min(double3 x, double3 y); | ||
| 2504 | @@ -10231,7 +10244,7 @@ double3 __ovld __cnfn min(double3 x, double y); | ||
| 2505 | double4 __ovld __cnfn min(double4 x, double y); | ||
| 2506 | double8 __ovld __cnfn min(double8 x, double y); | ||
| 2507 | double16 __ovld __cnfn min(double16 x, double y); | ||
| 2508 | -#endif //cl_khr_fp64 | ||
| 2509 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2510 | #ifdef cl_khr_fp16 | ||
| 2511 | half __ovld __cnfn min(half x, half y); | ||
| 2512 | half2 __ovld __cnfn min(half2 x, half2 y); | ||
| 2513 | @@ -10264,7 +10277,7 @@ float3 __ovld __cnfn mix(float3 x, float3 y, float a); | ||
| 2514 | float4 __ovld __cnfn mix(float4 x, float4 y, float a); | ||
| 2515 | float8 __ovld __cnfn mix(float8 x, float8 y, float a); | ||
| 2516 | float16 __ovld __cnfn mix(float16 x, float16 y, float a); | ||
| 2517 | -#ifdef cl_khr_fp64 | ||
| 2518 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2519 | double __ovld __cnfn mix(double x, double y, double a); | ||
| 2520 | double2 __ovld __cnfn mix(double2 x, double2 y, double2 a); | ||
| 2521 | double3 __ovld __cnfn mix(double3 x, double3 y, double3 a); | ||
| 2522 | @@ -10276,7 +10289,7 @@ double3 __ovld __cnfn mix(double3 x, double3 y, double a); | ||
| 2523 | double4 __ovld __cnfn mix(double4 x, double4 y, double a); | ||
| 2524 | double8 __ovld __cnfn mix(double8 x, double8 y, double a); | ||
| 2525 | double16 __ovld __cnfn mix(double16 x, double16 y, double a); | ||
| 2526 | -#endif //cl_khr_fp64 | ||
| 2527 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2528 | #ifdef cl_khr_fp16 | ||
| 2529 | half __ovld __cnfn mix(half x, half y, half a); | ||
| 2530 | half2 __ovld __cnfn mix(half2 x, half2 y, half2 a); | ||
| 2531 | @@ -10301,14 +10314,14 @@ float3 __ovld __cnfn radians(float3 degrees); | ||
| 2532 | float4 __ovld __cnfn radians(float4 degrees); | ||
| 2533 | float8 __ovld __cnfn radians(float8 degrees); | ||
| 2534 | float16 __ovld __cnfn radians(float16 degrees); | ||
| 2535 | -#ifdef cl_khr_fp64 | ||
| 2536 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2537 | double __ovld __cnfn radians(double degrees); | ||
| 2538 | double2 __ovld __cnfn radians(double2 degrees); | ||
| 2539 | double3 __ovld __cnfn radians(double3 degrees); | ||
| 2540 | double4 __ovld __cnfn radians(double4 degrees); | ||
| 2541 | double8 __ovld __cnfn radians(double8 degrees); | ||
| 2542 | double16 __ovld __cnfn radians(double16 degrees); | ||
| 2543 | -#endif //cl_khr_fp64 | ||
| 2544 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2545 | #ifdef cl_khr_fp16 | ||
| 2546 | half __ovld __cnfn radians(half degrees); | ||
| 2547 | half2 __ovld __cnfn radians(half2 degrees); | ||
| 2548 | @@ -10332,7 +10345,7 @@ float3 __ovld __cnfn step(float edge, float3 x); | ||
| 2549 | float4 __ovld __cnfn step(float edge, float4 x); | ||
| 2550 | float8 __ovld __cnfn step(float edge, float8 x); | ||
| 2551 | float16 __ovld __cnfn step(float edge, float16 x); | ||
| 2552 | -#ifdef cl_khr_fp64 | ||
| 2553 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2554 | double __ovld __cnfn step(double edge, double x); | ||
| 2555 | double2 __ovld __cnfn step(double2 edge, double2 x); | ||
| 2556 | double3 __ovld __cnfn step(double3 edge, double3 x); | ||
| 2557 | @@ -10344,7 +10357,7 @@ double3 __ovld __cnfn step(double edge, double3 x); | ||
| 2558 | double4 __ovld __cnfn step(double edge, double4 x); | ||
| 2559 | double8 __ovld __cnfn step(double edge, double8 x); | ||
| 2560 | double16 __ovld __cnfn step(double edge, double16 x); | ||
| 2561 | -#endif //cl_khr_fp64 | ||
| 2562 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2563 | #ifdef cl_khr_fp16 | ||
| 2564 | half __ovld __cnfn step(half edge, half x); | ||
| 2565 | half2 __ovld __cnfn step(half2 edge, half2 x); | ||
| 2566 | @@ -10383,7 +10396,7 @@ float3 __ovld __cnfn smoothstep(float edge0, float edge1, float3 x); | ||
| 2567 | float4 __ovld __cnfn smoothstep(float edge0, float edge1, float4 x); | ||
| 2568 | float8 __ovld __cnfn smoothstep(float edge0, float edge1, float8 x); | ||
| 2569 | float16 __ovld __cnfn smoothstep(float edge0, float edge1, float16 x); | ||
| 2570 | -#ifdef cl_khr_fp64 | ||
| 2571 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2572 | double __ovld __cnfn smoothstep(double edge0, double edge1, double x); | ||
| 2573 | double2 __ovld __cnfn smoothstep(double2 edge0, double2 edge1, double2 x); | ||
| 2574 | double3 __ovld __cnfn smoothstep(double3 edge0, double3 edge1, double3 x); | ||
| 2575 | @@ -10395,7 +10408,7 @@ double3 __ovld __cnfn smoothstep(double edge0, double edge1, double3 x); | ||
| 2576 | double4 __ovld __cnfn smoothstep(double edge0, double edge1, double4 x); | ||
| 2577 | double8 __ovld __cnfn smoothstep(double edge0, double edge1, double8 x); | ||
| 2578 | double16 __ovld __cnfn smoothstep(double edge0, double edge1, double16 x); | ||
| 2579 | -#endif //cl_khr_fp64 | ||
| 2580 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2581 | #ifdef cl_khr_fp16 | ||
| 2582 | half __ovld __cnfn smoothstep(half edge0, half edge1, half x); | ||
| 2583 | half2 __ovld __cnfn smoothstep(half2 edge0, half2 edge1, half2 x); | ||
| 2584 | @@ -10420,14 +10433,14 @@ float3 __ovld __cnfn sign(float3 x); | ||
| 2585 | float4 __ovld __cnfn sign(float4 x); | ||
| 2586 | float8 __ovld __cnfn sign(float8 x); | ||
| 2587 | float16 __ovld __cnfn sign(float16 x); | ||
| 2588 | -#ifdef cl_khr_fp64 | ||
| 2589 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2590 | double __ovld __cnfn sign(double x); | ||
| 2591 | double2 __ovld __cnfn sign(double2 x); | ||
| 2592 | double3 __ovld __cnfn sign(double3 x); | ||
| 2593 | double4 __ovld __cnfn sign(double4 x); | ||
| 2594 | double8 __ovld __cnfn sign(double8 x); | ||
| 2595 | double16 __ovld __cnfn sign(double16 x); | ||
| 2596 | -#endif //cl_khr_fp64 | ||
| 2597 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2598 | #ifdef cl_khr_fp16 | ||
| 2599 | half __ovld __cnfn sign(half x); | ||
| 2600 | half2 __ovld __cnfn sign(half2 x); | ||
| 2601 | @@ -10445,10 +10458,10 @@ half16 __ovld __cnfn sign(half16 x); | ||
| 2602 | */ | ||
| 2603 | float4 __ovld __cnfn cross(float4 p0, float4 p1); | ||
| 2604 | float3 __ovld __cnfn cross(float3 p0, float3 p1); | ||
| 2605 | -#ifdef cl_khr_fp64 | ||
| 2606 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2607 | double4 __ovld __cnfn cross(double4 p0, double4 p1); | ||
| 2608 | double3 __ovld __cnfn cross(double3 p0, double3 p1); | ||
| 2609 | -#endif //cl_khr_fp64 | ||
| 2610 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2611 | #ifdef cl_khr_fp16 | ||
| 2612 | half4 __ovld __cnfn cross(half4 p0, half4 p1); | ||
| 2613 | half3 __ovld __cnfn cross(half3 p0, half3 p1); | ||
| 2614 | @@ -10461,12 +10474,12 @@ float __ovld __cnfn dot(float p0, float p1); | ||
| 2615 | float __ovld __cnfn dot(float2 p0, float2 p1); | ||
| 2616 | float __ovld __cnfn dot(float3 p0, float3 p1); | ||
| 2617 | float __ovld __cnfn dot(float4 p0, float4 p1); | ||
| 2618 | -#ifdef cl_khr_fp64 | ||
| 2619 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2620 | double __ovld __cnfn dot(double p0, double p1); | ||
| 2621 | double __ovld __cnfn dot(double2 p0, double2 p1); | ||
| 2622 | double __ovld __cnfn dot(double3 p0, double3 p1); | ||
| 2623 | double __ovld __cnfn dot(double4 p0, double4 p1); | ||
| 2624 | -#endif //cl_khr_fp64 | ||
| 2625 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2626 | #ifdef cl_khr_fp16 | ||
| 2627 | half __ovld __cnfn dot(half p0, half p1); | ||
| 2628 | half __ovld __cnfn dot(half2 p0, half2 p1); | ||
| 2629 | @@ -10482,12 +10495,12 @@ float __ovld __cnfn distance(float p0, float p1); | ||
| 2630 | float __ovld __cnfn distance(float2 p0, float2 p1); | ||
| 2631 | float __ovld __cnfn distance(float3 p0, float3 p1); | ||
| 2632 | float __ovld __cnfn distance(float4 p0, float4 p1); | ||
| 2633 | -#ifdef cl_khr_fp64 | ||
| 2634 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2635 | double __ovld __cnfn distance(double p0, double p1); | ||
| 2636 | double __ovld __cnfn distance(double2 p0, double2 p1); | ||
| 2637 | double __ovld __cnfn distance(double3 p0, double3 p1); | ||
| 2638 | double __ovld __cnfn distance(double4 p0, double4 p1); | ||
| 2639 | -#endif //cl_khr_fp64 | ||
| 2640 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2641 | #ifdef cl_khr_fp16 | ||
| 2642 | half __ovld __cnfn distance(half p0, half p1); | ||
| 2643 | half __ovld __cnfn distance(half2 p0, half2 p1); | ||
| 2644 | @@ -10503,12 +10516,12 @@ float __ovld __cnfn length(float p); | ||
| 2645 | float __ovld __cnfn length(float2 p); | ||
| 2646 | float __ovld __cnfn length(float3 p); | ||
| 2647 | float __ovld __cnfn length(float4 p); | ||
| 2648 | -#ifdef cl_khr_fp64 | ||
| 2649 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2650 | double __ovld __cnfn length(double p); | ||
| 2651 | double __ovld __cnfn length(double2 p); | ||
| 2652 | double __ovld __cnfn length(double3 p); | ||
| 2653 | double __ovld __cnfn length(double4 p); | ||
| 2654 | -#endif //cl_khr_fp64 | ||
| 2655 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2656 | #ifdef cl_khr_fp16 | ||
| 2657 | half __ovld __cnfn length(half p); | ||
| 2658 | half __ovld __cnfn length(half2 p); | ||
| 2659 | @@ -10524,12 +10537,12 @@ float __ovld __cnfn normalize(float p); | ||
| 2660 | float2 __ovld __cnfn normalize(float2 p); | ||
| 2661 | float3 __ovld __cnfn normalize(float3 p); | ||
| 2662 | float4 __ovld __cnfn normalize(float4 p); | ||
| 2663 | -#ifdef cl_khr_fp64 | ||
| 2664 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2665 | double __ovld __cnfn normalize(double p); | ||
| 2666 | double2 __ovld __cnfn normalize(double2 p); | ||
| 2667 | double3 __ovld __cnfn normalize(double3 p); | ||
| 2668 | double4 __ovld __cnfn normalize(double4 p); | ||
| 2669 | -#endif //cl_khr_fp64 | ||
| 2670 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2671 | #ifdef cl_khr_fp16 | ||
| 2672 | half __ovld __cnfn normalize(half p); | ||
| 2673 | half2 __ovld __cnfn normalize(half2 p); | ||
| 2674 | @@ -10610,14 +10623,14 @@ int3 __ovld __cnfn isequal(float3 x, float3 y); | ||
| 2675 | int4 __ovld __cnfn isequal(float4 x, float4 y); | ||
| 2676 | int8 __ovld __cnfn isequal(float8 x, float8 y); | ||
| 2677 | int16 __ovld __cnfn isequal(float16 x, float16 y); | ||
| 2678 | -#ifdef cl_khr_fp64 | ||
| 2679 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2680 | int __ovld __cnfn isequal(double x, double y); | ||
| 2681 | long2 __ovld __cnfn isequal(double2 x, double2 y); | ||
| 2682 | long3 __ovld __cnfn isequal(double3 x, double3 y); | ||
| 2683 | long4 __ovld __cnfn isequal(double4 x, double4 y); | ||
| 2684 | long8 __ovld __cnfn isequal(double8 x, double8 y); | ||
| 2685 | long16 __ovld __cnfn isequal(double16 x, double16 y); | ||
| 2686 | -#endif //cl_khr_fp64 | ||
| 2687 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2688 | #ifdef cl_khr_fp16 | ||
| 2689 | int __ovld __cnfn isequal(half x, half y); | ||
| 2690 | short2 __ovld __cnfn isequal(half2 x, half2 y); | ||
| 2691 | @@ -10636,14 +10649,14 @@ int3 __ovld __cnfn isnotequal(float3 x, float3 y); | ||
| 2692 | int4 __ovld __cnfn isnotequal(float4 x, float4 y); | ||
| 2693 | int8 __ovld __cnfn isnotequal(float8 x, float8 y); | ||
| 2694 | int16 __ovld __cnfn isnotequal(float16 x, float16 y); | ||
| 2695 | -#ifdef cl_khr_fp64 | ||
| 2696 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2697 | int __ovld __cnfn isnotequal(double x, double y); | ||
| 2698 | long2 __ovld __cnfn isnotequal(double2 x, double2 y); | ||
| 2699 | long3 __ovld __cnfn isnotequal(double3 x, double3 y); | ||
| 2700 | long4 __ovld __cnfn isnotequal(double4 x, double4 y); | ||
| 2701 | long8 __ovld __cnfn isnotequal(double8 x, double8 y); | ||
| 2702 | long16 __ovld __cnfn isnotequal(double16 x, double16 y); | ||
| 2703 | -#endif //cl_khr_fp64 | ||
| 2704 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2705 | #ifdef cl_khr_fp16 | ||
| 2706 | int __ovld __cnfn isnotequal(half x, half y); | ||
| 2707 | short2 __ovld __cnfn isnotequal(half2 x, half2 y); | ||
| 2708 | @@ -10662,14 +10675,14 @@ int3 __ovld __cnfn isgreater(float3 x, float3 y); | ||
| 2709 | int4 __ovld __cnfn isgreater(float4 x, float4 y); | ||
| 2710 | int8 __ovld __cnfn isgreater(float8 x, float8 y); | ||
| 2711 | int16 __ovld __cnfn isgreater(float16 x, float16 y); | ||
| 2712 | -#ifdef cl_khr_fp64 | ||
| 2713 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2714 | int __ovld __cnfn isgreater(double x, double y); | ||
| 2715 | long2 __ovld __cnfn isgreater(double2 x, double2 y); | ||
| 2716 | long3 __ovld __cnfn isgreater(double3 x, double3 y); | ||
| 2717 | long4 __ovld __cnfn isgreater(double4 x, double4 y); | ||
| 2718 | long8 __ovld __cnfn isgreater(double8 x, double8 y); | ||
| 2719 | long16 __ovld __cnfn isgreater(double16 x, double16 y); | ||
| 2720 | -#endif //cl_khr_fp64 | ||
| 2721 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2722 | #ifdef cl_khr_fp16 | ||
| 2723 | int __ovld __cnfn isgreater(half x, half y); | ||
| 2724 | short2 __ovld __cnfn isgreater(half2 x, half2 y); | ||
| 2725 | @@ -10688,14 +10701,14 @@ int3 __ovld __cnfn isgreaterequal(float3 x, float3 y); | ||
| 2726 | int4 __ovld __cnfn isgreaterequal(float4 x, float4 y); | ||
| 2727 | int8 __ovld __cnfn isgreaterequal(float8 x, float8 y); | ||
| 2728 | int16 __ovld __cnfn isgreaterequal(float16 x, float16 y); | ||
| 2729 | -#ifdef cl_khr_fp64 | ||
| 2730 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2731 | int __ovld __cnfn isgreaterequal(double x, double y); | ||
| 2732 | long2 __ovld __cnfn isgreaterequal(double2 x, double2 y); | ||
| 2733 | long3 __ovld __cnfn isgreaterequal(double3 x, double3 y); | ||
| 2734 | long4 __ovld __cnfn isgreaterequal(double4 x, double4 y); | ||
| 2735 | long8 __ovld __cnfn isgreaterequal(double8 x, double8 y); | ||
| 2736 | long16 __ovld __cnfn isgreaterequal(double16 x, double16 y); | ||
| 2737 | -#endif //cl_khr_fp64 | ||
| 2738 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2739 | #ifdef cl_khr_fp16 | ||
| 2740 | int __ovld __cnfn isgreaterequal(half x, half y); | ||
| 2741 | short2 __ovld __cnfn isgreaterequal(half2 x, half2 y); | ||
| 2742 | @@ -10714,14 +10727,14 @@ int3 __ovld __cnfn isless(float3 x, float3 y); | ||
| 2743 | int4 __ovld __cnfn isless(float4 x, float4 y); | ||
| 2744 | int8 __ovld __cnfn isless(float8 x, float8 y); | ||
| 2745 | int16 __ovld __cnfn isless(float16 x, float16 y); | ||
| 2746 | -#ifdef cl_khr_fp64 | ||
| 2747 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2748 | int __ovld __cnfn isless(double x, double y); | ||
| 2749 | long2 __ovld __cnfn isless(double2 x, double2 y); | ||
| 2750 | long3 __ovld __cnfn isless(double3 x, double3 y); | ||
| 2751 | long4 __ovld __cnfn isless(double4 x, double4 y); | ||
| 2752 | long8 __ovld __cnfn isless(double8 x, double8 y); | ||
| 2753 | long16 __ovld __cnfn isless(double16 x, double16 y); | ||
| 2754 | -#endif //cl_khr_fp64 | ||
| 2755 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2756 | #ifdef cl_khr_fp16 | ||
| 2757 | int __ovld __cnfn isless(half x, half y); | ||
| 2758 | short2 __ovld __cnfn isless(half2 x, half2 y); | ||
| 2759 | @@ -10740,14 +10753,14 @@ int3 __ovld __cnfn islessequal(float3 x, float3 y); | ||
| 2760 | int4 __ovld __cnfn islessequal(float4 x, float4 y); | ||
| 2761 | int8 __ovld __cnfn islessequal(float8 x, float8 y); | ||
| 2762 | int16 __ovld __cnfn islessequal(float16 x, float16 y); | ||
| 2763 | -#ifdef cl_khr_fp64 | ||
| 2764 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2765 | int __ovld __cnfn islessequal(double x, double y); | ||
| 2766 | long2 __ovld __cnfn islessequal(double2 x, double2 y); | ||
| 2767 | long3 __ovld __cnfn islessequal(double3 x, double3 y); | ||
| 2768 | long4 __ovld __cnfn islessequal(double4 x, double4 y); | ||
| 2769 | long8 __ovld __cnfn islessequal(double8 x, double8 y); | ||
| 2770 | long16 __ovld __cnfn islessequal(double16 x, double16 y); | ||
| 2771 | -#endif //cl_khr_fp64 | ||
| 2772 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2773 | #ifdef cl_khr_fp16 | ||
| 2774 | int __ovld __cnfn islessequal(half x, half y); | ||
| 2775 | short2 __ovld __cnfn islessequal(half2 x, half2 y); | ||
| 2776 | @@ -10767,14 +10780,14 @@ int3 __ovld __cnfn islessgreater(float3 x, float3 y); | ||
| 2777 | int4 __ovld __cnfn islessgreater(float4 x, float4 y); | ||
| 2778 | int8 __ovld __cnfn islessgreater(float8 x, float8 y); | ||
| 2779 | int16 __ovld __cnfn islessgreater(float16 x, float16 y); | ||
| 2780 | -#ifdef cl_khr_fp64 | ||
| 2781 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2782 | int __ovld __cnfn islessgreater(double x, double y); | ||
| 2783 | long2 __ovld __cnfn islessgreater(double2 x, double2 y); | ||
| 2784 | long3 __ovld __cnfn islessgreater(double3 x, double3 y); | ||
| 2785 | long4 __ovld __cnfn islessgreater(double4 x, double4 y); | ||
| 2786 | long8 __ovld __cnfn islessgreater(double8 x, double8 y); | ||
| 2787 | long16 __ovld __cnfn islessgreater(double16 x, double16 y); | ||
| 2788 | -#endif //cl_khr_fp64 | ||
| 2789 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2790 | #ifdef cl_khr_fp16 | ||
| 2791 | int __ovld __cnfn islessgreater(half x, half y); | ||
| 2792 | short2 __ovld __cnfn islessgreater(half2 x, half2 y); | ||
| 2793 | @@ -10793,14 +10806,14 @@ int3 __ovld __cnfn isfinite(float3); | ||
| 2794 | int4 __ovld __cnfn isfinite(float4); | ||
| 2795 | int8 __ovld __cnfn isfinite(float8); | ||
| 2796 | int16 __ovld __cnfn isfinite(float16); | ||
| 2797 | -#ifdef cl_khr_fp64 | ||
| 2798 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2799 | int __ovld __cnfn isfinite(double); | ||
| 2800 | long2 __ovld __cnfn isfinite(double2); | ||
| 2801 | long3 __ovld __cnfn isfinite(double3); | ||
| 2802 | long4 __ovld __cnfn isfinite(double4); | ||
| 2803 | long8 __ovld __cnfn isfinite(double8); | ||
| 2804 | long16 __ovld __cnfn isfinite(double16); | ||
| 2805 | -#endif //cl_khr_fp64 | ||
| 2806 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2807 | #ifdef cl_khr_fp16 | ||
| 2808 | int __ovld __cnfn isfinite(half); | ||
| 2809 | short2 __ovld __cnfn isfinite(half2); | ||
| 2810 | @@ -10819,14 +10832,14 @@ int3 __ovld __cnfn isinf(float3); | ||
| 2811 | int4 __ovld __cnfn isinf(float4); | ||
| 2812 | int8 __ovld __cnfn isinf(float8); | ||
| 2813 | int16 __ovld __cnfn isinf(float16); | ||
| 2814 | -#ifdef cl_khr_fp64 | ||
| 2815 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2816 | int __ovld __cnfn isinf(double); | ||
| 2817 | long2 __ovld __cnfn isinf(double2); | ||
| 2818 | long3 __ovld __cnfn isinf(double3); | ||
| 2819 | long4 __ovld __cnfn isinf(double4); | ||
| 2820 | long8 __ovld __cnfn isinf(double8); | ||
| 2821 | long16 __ovld __cnfn isinf(double16); | ||
| 2822 | -#endif //cl_khr_fp64 | ||
| 2823 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2824 | #ifdef cl_khr_fp16 | ||
| 2825 | int __ovld __cnfn isinf(half); | ||
| 2826 | short2 __ovld __cnfn isinf(half2); | ||
| 2827 | @@ -10845,14 +10858,14 @@ int3 __ovld __cnfn isnan(float3); | ||
| 2828 | int4 __ovld __cnfn isnan(float4); | ||
| 2829 | int8 __ovld __cnfn isnan(float8); | ||
| 2830 | int16 __ovld __cnfn isnan(float16); | ||
| 2831 | -#ifdef cl_khr_fp64 | ||
| 2832 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2833 | int __ovld __cnfn isnan(double); | ||
| 2834 | long2 __ovld __cnfn isnan(double2); | ||
| 2835 | long3 __ovld __cnfn isnan(double3); | ||
| 2836 | long4 __ovld __cnfn isnan(double4); | ||
| 2837 | long8 __ovld __cnfn isnan(double8); | ||
| 2838 | long16 __ovld __cnfn isnan(double16); | ||
| 2839 | -#endif //cl_khr_fp64 | ||
| 2840 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2841 | #ifdef cl_khr_fp16 | ||
| 2842 | int __ovld __cnfn isnan(half); | ||
| 2843 | short2 __ovld __cnfn isnan(half2); | ||
| 2844 | @@ -10871,14 +10884,14 @@ int3 __ovld __cnfn isnormal(float3); | ||
| 2845 | int4 __ovld __cnfn isnormal(float4); | ||
| 2846 | int8 __ovld __cnfn isnormal(float8); | ||
| 2847 | int16 __ovld __cnfn isnormal(float16); | ||
| 2848 | -#ifdef cl_khr_fp64 | ||
| 2849 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2850 | int __ovld __cnfn isnormal(double); | ||
| 2851 | long2 __ovld __cnfn isnormal(double2); | ||
| 2852 | long3 __ovld __cnfn isnormal(double3); | ||
| 2853 | long4 __ovld __cnfn isnormal(double4); | ||
| 2854 | long8 __ovld __cnfn isnormal(double8); | ||
| 2855 | long16 __ovld __cnfn isnormal(double16); | ||
| 2856 | -#endif //cl_khr_fp64 | ||
| 2857 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2858 | #ifdef cl_khr_fp16 | ||
| 2859 | int __ovld __cnfn isnormal(half); | ||
| 2860 | short2 __ovld __cnfn isnormal(half2); | ||
| 2861 | @@ -10899,14 +10912,14 @@ int3 __ovld __cnfn isordered(float3 x, float3 y); | ||
| 2862 | int4 __ovld __cnfn isordered(float4 x, float4 y); | ||
| 2863 | int8 __ovld __cnfn isordered(float8 x, float8 y); | ||
| 2864 | int16 __ovld __cnfn isordered(float16 x, float16 y); | ||
| 2865 | -#ifdef cl_khr_fp64 | ||
| 2866 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2867 | int __ovld __cnfn isordered(double x, double y); | ||
| 2868 | long2 __ovld __cnfn isordered(double2 x, double2 y); | ||
| 2869 | long3 __ovld __cnfn isordered(double3 x, double3 y); | ||
| 2870 | long4 __ovld __cnfn isordered(double4 x, double4 y); | ||
| 2871 | long8 __ovld __cnfn isordered(double8 x, double8 y); | ||
| 2872 | long16 __ovld __cnfn isordered(double16 x, double16 y); | ||
| 2873 | -#endif //cl_khr_fp64 | ||
| 2874 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2875 | #ifdef cl_khr_fp16 | ||
| 2876 | int __ovld __cnfn isordered(half x, half y); | ||
| 2877 | short2 __ovld __cnfn isordered(half2 x, half2 y); | ||
| 2878 | @@ -10927,14 +10940,14 @@ int3 __ovld __cnfn isunordered(float3 x, float3 y); | ||
| 2879 | int4 __ovld __cnfn isunordered(float4 x, float4 y); | ||
| 2880 | int8 __ovld __cnfn isunordered(float8 x, float8 y); | ||
| 2881 | int16 __ovld __cnfn isunordered(float16 x, float16 y); | ||
| 2882 | -#ifdef cl_khr_fp64 | ||
| 2883 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2884 | int __ovld __cnfn isunordered(double x, double y); | ||
| 2885 | long2 __ovld __cnfn isunordered(double2 x, double2 y); | ||
| 2886 | long3 __ovld __cnfn isunordered(double3 x, double3 y); | ||
| 2887 | long4 __ovld __cnfn isunordered(double4 x, double4 y); | ||
| 2888 | long8 __ovld __cnfn isunordered(double8 x, double8 y); | ||
| 2889 | long16 __ovld __cnfn isunordered(double16 x, double16 y); | ||
| 2890 | -#endif //cl_khr_fp64 | ||
| 2891 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2892 | #ifdef cl_khr_fp16 | ||
| 2893 | int __ovld __cnfn isunordered(half x, half y); | ||
| 2894 | short2 __ovld __cnfn isunordered(half2 x, half2 y); | ||
| 2895 | @@ -10957,14 +10970,14 @@ int3 __ovld __cnfn signbit(float3); | ||
| 2896 | int4 __ovld __cnfn signbit(float4); | ||
| 2897 | int8 __ovld __cnfn signbit(float8); | ||
| 2898 | int16 __ovld __cnfn signbit(float16); | ||
| 2899 | -#ifdef cl_khr_fp64 | ||
| 2900 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2901 | int __ovld __cnfn signbit(double); | ||
| 2902 | long2 __ovld __cnfn signbit(double2); | ||
| 2903 | long3 __ovld __cnfn signbit(double3); | ||
| 2904 | long4 __ovld __cnfn signbit(double4); | ||
| 2905 | long8 __ovld __cnfn signbit(double8); | ||
| 2906 | long16 __ovld __cnfn signbit(double16); | ||
| 2907 | -#endif //cl_khr_fp64 | ||
| 2908 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2909 | #ifdef cl_khr_fp16 | ||
| 2910 | int __ovld __cnfn signbit(half); | ||
| 2911 | short2 __ovld __cnfn signbit(half2); | ||
| 2912 | @@ -11091,14 +11104,14 @@ float3 __ovld __cnfn bitselect(float3 a, float3 b, float3 c); | ||
| 2913 | float4 __ovld __cnfn bitselect(float4 a, float4 b, float4 c); | ||
| 2914 | float8 __ovld __cnfn bitselect(float8 a, float8 b, float8 c); | ||
| 2915 | float16 __ovld __cnfn bitselect(float16 a, float16 b, float16 c); | ||
| 2916 | -#ifdef cl_khr_fp64 | ||
| 2917 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2918 | double __ovld __cnfn bitselect(double a, double b, double c); | ||
| 2919 | double2 __ovld __cnfn bitselect(double2 a, double2 b, double2 c); | ||
| 2920 | double3 __ovld __cnfn bitselect(double3 a, double3 b, double3 c); | ||
| 2921 | double4 __ovld __cnfn bitselect(double4 a, double4 b, double4 c); | ||
| 2922 | double8 __ovld __cnfn bitselect(double8 a, double8 b, double8 c); | ||
| 2923 | double16 __ovld __cnfn bitselect(double16 a, double16 b, double16 c); | ||
| 2924 | -#endif //cl_khr_fp64 | ||
| 2925 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2926 | #ifdef cl_khr_fp16 | ||
| 2927 | half __ovld __cnfn bitselect(half a, half b, half c); | ||
| 2928 | half2 __ovld __cnfn bitselect(half2 a, half2 b, half2 c); | ||
| 2929 | @@ -11231,7 +11244,7 @@ ulong8 __ovld __cnfn select(ulong8 a, ulong8 b, ulong8 c); | ||
| 2930 | long16 __ovld __cnfn select(long16 a, long16 b, ulong16 c); | ||
| 2931 | ulong16 __ovld __cnfn select(ulong16 a, ulong16 b, ulong16 c); | ||
| 2932 | |||
| 2933 | -#ifdef cl_khr_fp64 | ||
| 2934 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2935 | double __ovld __cnfn select(double a, double b, long c); | ||
| 2936 | double2 __ovld __cnfn select(double2 a, double2 b, long2 c); | ||
| 2937 | double3 __ovld __cnfn select(double3 a, double3 b, long3 c); | ||
| 2938 | @@ -11244,7 +11257,7 @@ double3 __ovld __cnfn select(double3 a, double3 b, ulong3 c); | ||
| 2939 | double4 __ovld __cnfn select(double4 a, double4 b, ulong4 c); | ||
| 2940 | double8 __ovld __cnfn select(double8 a, double8 b, ulong8 c); | ||
| 2941 | double16 __ovld __cnfn select(double16 a, double16 b, ulong16 c); | ||
| 2942 | -#endif //cl_khr_fp64 | ||
| 2943 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2944 | #ifdef cl_khr_fp16 | ||
| 2945 | half __ovld __cnfn select(half a, half b, short c); | ||
| 2946 | half2 __ovld __cnfn select(half2 a, half2 b, short2 c); | ||
| 2947 | @@ -11323,13 +11336,13 @@ uint16 __ovld vload16(size_t offset, const __constant uint *p); | ||
| 2948 | long16 __ovld vload16(size_t offset, const __constant long *p); | ||
| 2949 | ulong16 __ovld vload16(size_t offset, const __constant ulong *p); | ||
| 2950 | float16 __ovld vload16(size_t offset, const __constant float *p); | ||
| 2951 | -#ifdef cl_khr_fp64 | ||
| 2952 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2953 | double2 __ovld vload2(size_t offset, const __constant double *p); | ||
| 2954 | double3 __ovld vload3(size_t offset, const __constant double *p); | ||
| 2955 | double4 __ovld vload4(size_t offset, const __constant double *p); | ||
| 2956 | double8 __ovld vload8(size_t offset, const __constant double *p); | ||
| 2957 | double16 __ovld vload16(size_t offset, const __constant double *p); | ||
| 2958 | -#endif //cl_khr_fp64 | ||
| 2959 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2960 | |||
| 2961 | #ifdef cl_khr_fp16 | ||
| 2962 | half __ovld vload(size_t offset, const __constant half *p); | ||
| 2963 | @@ -11340,7 +11353,7 @@ half8 __ovld vload8(size_t offset, const __constant half *p); | ||
| 2964 | half16 __ovld vload16(size_t offset, const __constant half *p); | ||
| 2965 | #endif //cl_khr_fp16 | ||
| 2966 | |||
| 2967 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2968 | +#ifdef __opencl_c_generic_address_space | ||
| 2969 | char2 __ovld vload2(size_t offset, const char *p); | ||
| 2970 | uchar2 __ovld vload2(size_t offset, const uchar *p); | ||
| 2971 | short2 __ovld vload2(size_t offset, const short *p); | ||
| 2972 | @@ -11387,13 +11400,13 @@ long16 __ovld vload16(size_t offset, const long *p); | ||
| 2973 | ulong16 __ovld vload16(size_t offset, const ulong *p); | ||
| 2974 | float16 __ovld vload16(size_t offset, const float *p); | ||
| 2975 | |||
| 2976 | -#ifdef cl_khr_fp64 | ||
| 2977 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2978 | double2 __ovld vload2(size_t offset, const double *p); | ||
| 2979 | double3 __ovld vload3(size_t offset, const double *p); | ||
| 2980 | double4 __ovld vload4(size_t offset, const double *p); | ||
| 2981 | double8 __ovld vload8(size_t offset, const double *p); | ||
| 2982 | double16 __ovld vload16(size_t offset, const double *p); | ||
| 2983 | -#endif //cl_khr_fp64 | ||
| 2984 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2985 | |||
| 2986 | #ifdef cl_khr_fp16 | ||
| 2987 | half __ovld vload(size_t offset, const half *p); | ||
| 2988 | @@ -11403,7 +11416,7 @@ half4 __ovld vload4(size_t offset, const half *p); | ||
| 2989 | half8 __ovld vload8(size_t offset, const half *p); | ||
| 2990 | half16 __ovld vload16(size_t offset, const half *p); | ||
| 2991 | #endif //cl_khr_fp16 | ||
| 2992 | -#else | ||
| 2993 | +#endif //__opencl_c_generic_address_space | ||
| 2994 | char2 __ovld vload2(size_t offset, const __global char *p); | ||
| 2995 | uchar2 __ovld vload2(size_t offset, const __global uchar *p); | ||
| 2996 | short2 __ovld vload2(size_t offset, const __global short *p); | ||
| 2997 | @@ -11540,7 +11553,7 @@ long16 __ovld vload16(size_t offset, const __private long *p); | ||
| 2998 | ulong16 __ovld vload16(size_t offset, const __private ulong *p); | ||
| 2999 | float16 __ovld vload16(size_t offset, const __private float *p); | ||
| 3000 | |||
| 3001 | -#ifdef cl_khr_fp64 | ||
| 3002 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3003 | double2 __ovld vload2(size_t offset, const __global double *p); | ||
| 3004 | double3 __ovld vload3(size_t offset, const __global double *p); | ||
| 3005 | double4 __ovld vload4(size_t offset, const __global double *p); | ||
| 3006 | @@ -11556,7 +11569,7 @@ double3 __ovld vload3(size_t offset, const __private double *p); | ||
| 3007 | double4 __ovld vload4(size_t offset, const __private double *p); | ||
| 3008 | double8 __ovld vload8(size_t offset, const __private double *p); | ||
| 3009 | double16 __ovld vload16(size_t offset, const __private double *p); | ||
| 3010 | -#endif //cl_khr_fp64 | ||
| 3011 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3012 | |||
| 3013 | #ifdef cl_khr_fp16 | ||
| 3014 | half __ovld vload(size_t offset, const __global half *p); | ||
| 3015 | @@ -11578,9 +11591,8 @@ half4 __ovld vload4(size_t offset, const __private half *p); | ||
| 3016 | half8 __ovld vload8(size_t offset, const __private half *p); | ||
| 3017 | half16 __ovld vload16(size_t offset, const __private half *p); | ||
| 3018 | #endif //cl_khr_fp16 | ||
| 3019 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3020 | |||
| 3021 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3022 | +#ifdef __opencl_c_generic_address_space | ||
| 3023 | void __ovld vstore2(char2 data, size_t offset, char *p); | ||
| 3024 | void __ovld vstore2(uchar2 data, size_t offset, uchar *p); | ||
| 3025 | void __ovld vstore2(short2 data, size_t offset, short *p); | ||
| 3026 | @@ -11626,13 +11638,13 @@ void __ovld vstore16(uint16 data, size_t offset, uint *p); | ||
| 3027 | void __ovld vstore16(long16 data, size_t offset, long *p); | ||
| 3028 | void __ovld vstore16(ulong16 data, size_t offset, ulong *p); | ||
| 3029 | void __ovld vstore16(float16 data, size_t offset, float *p); | ||
| 3030 | -#ifdef cl_khr_fp64 | ||
| 3031 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3032 | void __ovld vstore2(double2 data, size_t offset, double *p); | ||
| 3033 | void __ovld vstore3(double3 data, size_t offset, double *p); | ||
| 3034 | void __ovld vstore4(double4 data, size_t offset, double *p); | ||
| 3035 | void __ovld vstore8(double8 data, size_t offset, double *p); | ||
| 3036 | void __ovld vstore16(double16 data, size_t offset, double *p); | ||
| 3037 | -#endif //cl_khr_fp64 | ||
| 3038 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3039 | #ifdef cl_khr_fp16 | ||
| 3040 | void __ovld vstore(half data, size_t offset, half *p); | ||
| 3041 | void __ovld vstore2(half2 data, size_t offset, half *p); | ||
| 3042 | @@ -11641,7 +11653,7 @@ void __ovld vstore4(half4 data, size_t offset, half *p); | ||
| 3043 | void __ovld vstore8(half8 data, size_t offset, half *p); | ||
| 3044 | void __ovld vstore16(half16 data, size_t offset, half *p); | ||
| 3045 | #endif //cl_khr_fp16 | ||
| 3046 | -#else | ||
| 3047 | +#endif //__opencl_c_generic_address_space | ||
| 3048 | void __ovld vstore2(char2 data, size_t offset, __global char *p); | ||
| 3049 | void __ovld vstore2(uchar2 data, size_t offset, __global uchar *p); | ||
| 3050 | void __ovld vstore2(short2 data, size_t offset, __global short *p); | ||
| 3051 | @@ -11777,7 +11789,7 @@ void __ovld vstore16(uint16 data, size_t offset, __private uint *p); | ||
| 3052 | void __ovld vstore16(long16 data, size_t offset, __private long *p); | ||
| 3053 | void __ovld vstore16(ulong16 data, size_t offset, __private ulong *p); | ||
| 3054 | void __ovld vstore16(float16 data, size_t offset, __private float *p); | ||
| 3055 | -#ifdef cl_khr_fp64 | ||
| 3056 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3057 | void __ovld vstore2(double2 data, size_t offset, __global double *p); | ||
| 3058 | void __ovld vstore3(double3 data, size_t offset, __global double *p); | ||
| 3059 | void __ovld vstore4(double4 data, size_t offset, __global double *p); | ||
| 3060 | @@ -11793,7 +11805,7 @@ void __ovld vstore3(double3 data, size_t offset, __private double *p); | ||
| 3061 | void __ovld vstore4(double4 data, size_t offset, __private double *p); | ||
| 3062 | void __ovld vstore8(double8 data, size_t offset, __private double *p); | ||
| 3063 | void __ovld vstore16(double16 data, size_t offset, __private double *p); | ||
| 3064 | -#endif //cl_khr_fp64 | ||
| 3065 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3066 | #ifdef cl_khr_fp16 | ||
| 3067 | void __ovld vstore(half data, size_t offset, __global half *p); | ||
| 3068 | void __ovld vstore2(half2 data, size_t offset, __global half *p); | ||
| 3069 | @@ -11814,7 +11826,6 @@ void __ovld vstore4(half4 data, size_t offset, __private half *p); | ||
| 3070 | void __ovld vstore8(half8 data, size_t offset, __private half *p); | ||
| 3071 | void __ovld vstore16(half16 data, size_t offset, __private half *p); | ||
| 3072 | #endif //cl_khr_fp16 | ||
| 3073 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3074 | |||
| 3075 | /** | ||
| 3076 | * Read sizeof (half) bytes of data from address | ||
| 3077 | @@ -11825,13 +11836,12 @@ void __ovld vstore16(half16 data, size_t offset, __private half *p); | ||
| 3078 | * must be 16-bit aligned. | ||
| 3079 | */ | ||
| 3080 | float __ovld vload_half(size_t offset, const __constant half *p); | ||
| 3081 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3082 | +#ifdef __opencl_c_generic_address_space | ||
| 3083 | float __ovld vload_half(size_t offset, const half *p); | ||
| 3084 | -#else | ||
| 3085 | +#endif //__opencl_c_generic_address_space | ||
| 3086 | float __ovld vload_half(size_t offset, const __global half *p); | ||
| 3087 | float __ovld vload_half(size_t offset, const __local half *p); | ||
| 3088 | float __ovld vload_half(size_t offset, const __private half *p); | ||
| 3089 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3090 | |||
| 3091 | /** | ||
| 3092 | * Read sizeof (halfn) bytes of data from address | ||
| 3093 | @@ -11846,13 +11856,13 @@ float3 __ovld vload_half3(size_t offset, const __constant half *p); | ||
| 3094 | float4 __ovld vload_half4(size_t offset, const __constant half *p); | ||
| 3095 | float8 __ovld vload_half8(size_t offset, const __constant half *p); | ||
| 3096 | float16 __ovld vload_half16(size_t offset, const __constant half *p); | ||
| 3097 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3098 | +#ifdef __opencl_c_generic_address_space | ||
| 3099 | float2 __ovld vload_half2(size_t offset, const half *p); | ||
| 3100 | float3 __ovld vload_half3(size_t offset, const half *p); | ||
| 3101 | float4 __ovld vload_half4(size_t offset, const half *p); | ||
| 3102 | float8 __ovld vload_half8(size_t offset, const half *p); | ||
| 3103 | float16 __ovld vload_half16(size_t offset, const half *p); | ||
| 3104 | -#else | ||
| 3105 | +#endif //__opencl_c_generic_address_space | ||
| 3106 | float2 __ovld vload_half2(size_t offset, const __global half *p); | ||
| 3107 | float3 __ovld vload_half3(size_t offset, const __global half *p); | ||
| 3108 | float4 __ovld vload_half4(size_t offset, const __global half *p); | ||
| 3109 | @@ -11868,7 +11878,6 @@ float3 __ovld vload_half3(size_t offset, const __private half *p); | ||
| 3110 | float4 __ovld vload_half4(size_t offset, const __private half *p); | ||
| 3111 | float8 __ovld vload_half8(size_t offset, const __private half *p); | ||
| 3112 | float16 __ovld vload_half16(size_t offset, const __private half *p); | ||
| 3113 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3114 | |||
| 3115 | /** | ||
| 3116 | * The float value given by data is first | ||
| 3117 | @@ -11881,20 +11890,20 @@ float16 __ovld vload_half16(size_t offset, const __private half *p); | ||
| 3118 | * The default current rounding mode is round to | ||
| 3119 | * nearest even. | ||
| 3120 | */ | ||
| 3121 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3122 | +#ifdef __opencl_c_generic_address_space | ||
| 3123 | void __ovld vstore_half(float data, size_t offset, half *p); | ||
| 3124 | void __ovld vstore_half_rte(float data, size_t offset, half *p); | ||
| 3125 | void __ovld vstore_half_rtz(float data, size_t offset, half *p); | ||
| 3126 | void __ovld vstore_half_rtp(float data, size_t offset, half *p); | ||
| 3127 | void __ovld vstore_half_rtn(float data, size_t offset, half *p); | ||
| 3128 | -#ifdef cl_khr_fp64 | ||
| 3129 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3130 | void __ovld vstore_half(double data, size_t offset, half *p); | ||
| 3131 | void __ovld vstore_half_rte(double data, size_t offset, half *p); | ||
| 3132 | void __ovld vstore_half_rtz(double data, size_t offset, half *p); | ||
| 3133 | void __ovld vstore_half_rtp(double data, size_t offset, half *p); | ||
| 3134 | void __ovld vstore_half_rtn(double data, size_t offset, half *p); | ||
| 3135 | -#endif //cl_khr_fp64 | ||
| 3136 | -#else | ||
| 3137 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3138 | +#endif //__opencl_c_generic_address_space | ||
| 3139 | void __ovld vstore_half(float data, size_t offset, __global half *p); | ||
| 3140 | void __ovld vstore_half_rte(float data, size_t offset, __global half *p); | ||
| 3141 | void __ovld vstore_half_rtz(float data, size_t offset, __global half *p); | ||
| 3142 | @@ -11910,7 +11919,7 @@ void __ovld vstore_half_rte(float data, size_t offset, __private half *p); | ||
| 3143 | void __ovld vstore_half_rtz(float data, size_t offset, __private half *p); | ||
| 3144 | void __ovld vstore_half_rtp(float data, size_t offset, __private half *p); | ||
| 3145 | void __ovld vstore_half_rtn(float data, size_t offset, __private half *p); | ||
| 3146 | -#ifdef cl_khr_fp64 | ||
| 3147 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3148 | void __ovld vstore_half(double data, size_t offset, __global half *p); | ||
| 3149 | void __ovld vstore_half_rte(double data, size_t offset, __global half *p); | ||
| 3150 | void __ovld vstore_half_rtz(double data, size_t offset, __global half *p); | ||
| 3151 | @@ -11926,8 +11935,7 @@ void __ovld vstore_half_rte(double data, size_t offset, __private half *p); | ||
| 3152 | void __ovld vstore_half_rtz(double data, size_t offset, __private half *p); | ||
| 3153 | void __ovld vstore_half_rtp(double data, size_t offset, __private half *p); | ||
| 3154 | void __ovld vstore_half_rtn(double data, size_t offset, __private half *p); | ||
| 3155 | -#endif //cl_khr_fp64 | ||
| 3156 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3157 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3158 | |||
| 3159 | /** | ||
| 3160 | * The floatn value given by data is converted to | ||
| 3161 | @@ -11940,7 +11948,7 @@ void __ovld vstore_half_rtn(double data, size_t offset, __private half *p); | ||
| 3162 | * The default current rounding mode is round to | ||
| 3163 | * nearest even. | ||
| 3164 | */ | ||
| 3165 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3166 | +#ifdef __opencl_c_generic_address_space | ||
| 3167 | void __ovld vstore_half2(float2 data, size_t offset, half *p); | ||
| 3168 | void __ovld vstore_half3(float3 data, size_t offset, half *p); | ||
| 3169 | void __ovld vstore_half4(float4 data, size_t offset, half *p); | ||
| 3170 | @@ -11966,7 +11974,7 @@ void __ovld vstore_half3_rtn(float3 data, size_t offset, half *p); | ||
| 3171 | void __ovld vstore_half4_rtn(float4 data, size_t offset, half *p); | ||
| 3172 | void __ovld vstore_half8_rtn(float8 data, size_t offset, half *p); | ||
| 3173 | void __ovld vstore_half16_rtn(float16 data, size_t offset, half *p); | ||
| 3174 | -#ifdef cl_khr_fp64 | ||
| 3175 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3176 | void __ovld vstore_half2(double2 data, size_t offset, half *p); | ||
| 3177 | void __ovld vstore_half3(double3 data, size_t offset, half *p); | ||
| 3178 | void __ovld vstore_half4(double4 data, size_t offset, half *p); | ||
| 3179 | @@ -11992,8 +12000,8 @@ void __ovld vstore_half3_rtn(double3 data, size_t offset, half *p); | ||
| 3180 | void __ovld vstore_half4_rtn(double4 data, size_t offset, half *p); | ||
| 3181 | void __ovld vstore_half8_rtn(double8 data, size_t offset, half *p); | ||
| 3182 | void __ovld vstore_half16_rtn(double16 data, size_t offset, half *p); | ||
| 3183 | -#endif //cl_khr_fp64 | ||
| 3184 | -#else | ||
| 3185 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3186 | +#endif //__opencl_c_generic_address_space | ||
| 3187 | void __ovld vstore_half2(float2 data, size_t offset, __global half *p); | ||
| 3188 | void __ovld vstore_half3(float3 data, size_t offset, __global half *p); | ||
| 3189 | void __ovld vstore_half4(float4 data, size_t offset, __global half *p); | ||
| 3190 | @@ -12069,7 +12077,7 @@ void __ovld vstore_half3_rtn(float3 data, size_t offset, __private half *p); | ||
| 3191 | void __ovld vstore_half4_rtn(float4 data, size_t offset, __private half *p); | ||
| 3192 | void __ovld vstore_half8_rtn(float8 data, size_t offset, __private half *p); | ||
| 3193 | void __ovld vstore_half16_rtn(float16 data, size_t offset, __private half *p); | ||
| 3194 | -#ifdef cl_khr_fp64 | ||
| 3195 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3196 | void __ovld vstore_half2(double2 data, size_t offset, __global half *p); | ||
| 3197 | void __ovld vstore_half3(double3 data, size_t offset, __global half *p); | ||
| 3198 | void __ovld vstore_half4(double4 data, size_t offset, __global half *p); | ||
| 3199 | @@ -12145,8 +12153,7 @@ void __ovld vstore_half3_rtn(double3 data, size_t offset, __private half *p); | ||
| 3200 | void __ovld vstore_half4_rtn(double4 data, size_t offset, __private half *p); | ||
| 3201 | void __ovld vstore_half8_rtn(double8 data, size_t offset, __private half *p); | ||
| 3202 | void __ovld vstore_half16_rtn(double16 data, size_t offset, __private half *p); | ||
| 3203 | -#endif //cl_khr_fp64 | ||
| 3204 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3205 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3206 | |||
| 3207 | /** | ||
| 3208 | * For n = 1, 2, 4, 8 and 16 read sizeof (halfn) | ||
| 3209 | @@ -12167,14 +12174,14 @@ float3 __ovld vloada_half3(size_t offset, const __constant half *p); | ||
| 3210 | float4 __ovld vloada_half4(size_t offset, const __constant half *p); | ||
| 3211 | float8 __ovld vloada_half8(size_t offset, const __constant half *p); | ||
| 3212 | float16 __ovld vloada_half16(size_t offset, const __constant half *p); | ||
| 3213 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3214 | +#ifdef __opencl_c_generic_address_space | ||
| 3215 | float __ovld vloada_half(size_t offset, const half *p); | ||
| 3216 | float2 __ovld vloada_half2(size_t offset, const half *p); | ||
| 3217 | float3 __ovld vloada_half3(size_t offset, const half *p); | ||
| 3218 | float4 __ovld vloada_half4(size_t offset, const half *p); | ||
| 3219 | float8 __ovld vloada_half8(size_t offset, const half *p); | ||
| 3220 | float16 __ovld vloada_half16(size_t offset, const half *p); | ||
| 3221 | -#else | ||
| 3222 | +#endif //__opencl_c_generic_address_space | ||
| 3223 | float __ovld vloada_half(size_t offset, const __global half *p); | ||
| 3224 | float2 __ovld vloada_half2(size_t offset, const __global half *p); | ||
| 3225 | float3 __ovld vloada_half3(size_t offset, const __global half *p); | ||
| 3226 | @@ -12193,7 +12200,6 @@ float3 __ovld vloada_half3(size_t offset, const __private half *p); | ||
| 3227 | float4 __ovld vloada_half4(size_t offset, const __private half *p); | ||
| 3228 | float8 __ovld vloada_half8(size_t offset, const __private half *p); | ||
| 3229 | float16 __ovld vloada_half16(size_t offset, const __private half *p); | ||
| 3230 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3231 | |||
| 3232 | /** | ||
| 3233 | * The floatn value given by data is converted to | ||
| 3234 | @@ -12211,7 +12217,7 @@ float16 __ovld vloada_half16(size_t offset, const __private half *p); | ||
| 3235 | * mode. The default current rounding mode is | ||
| 3236 | * round to nearest even. | ||
| 3237 | */ | ||
| 3238 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3239 | +#ifdef __opencl_c_generic_address_space | ||
| 3240 | void __ovld vstorea_half(float data, size_t offset, half *p); | ||
| 3241 | void __ovld vstorea_half2(float2 data, size_t offset, half *p); | ||
| 3242 | void __ovld vstorea_half3(float3 data, size_t offset, half *p); | ||
| 3243 | @@ -12247,7 +12253,7 @@ void __ovld vstorea_half4_rtn(float4 data, size_t offset, half *p); | ||
| 3244 | void __ovld vstorea_half8_rtn(float8 data, size_t offset, half *p); | ||
| 3245 | void __ovld vstorea_half16_rtn(float16 data, size_t offset, half *p); | ||
| 3246 | |||
| 3247 | -#ifdef cl_khr_fp64 | ||
| 3248 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3249 | void __ovld vstorea_half(double data, size_t offset, half *p); | ||
| 3250 | void __ovld vstorea_half2(double2 data, size_t offset, half *p); | ||
| 3251 | void __ovld vstorea_half3(double3 data, size_t offset, half *p); | ||
| 3252 | @@ -12282,9 +12288,9 @@ void __ovld vstorea_half3_rtn(double3 data, size_t offset, half *p); | ||
| 3253 | void __ovld vstorea_half4_rtn(double4 data, size_t offset, half *p); | ||
| 3254 | void __ovld vstorea_half8_rtn(double8 data, size_t offset, half *p); | ||
| 3255 | void __ovld vstorea_half16_rtn(double16 data, size_t offset, half *p); | ||
| 3256 | -#endif //cl_khr_fp64 | ||
| 3257 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3258 | +#endif //__opencl_c_generic_address_space | ||
| 3259 | |||
| 3260 | -#else | ||
| 3261 | void __ovld vstorea_half(float data, size_t offset, __global half *p); | ||
| 3262 | void __ovld vstorea_half2(float2 data, size_t offset, __global half *p); | ||
| 3263 | void __ovld vstorea_half3(float3 data, size_t offset, __global half *p); | ||
| 3264 | @@ -12390,7 +12396,7 @@ void __ovld vstorea_half4_rtn(float4 data, size_t offset, __private half *p); | ||
| 3265 | void __ovld vstorea_half8_rtn(float8 data, size_t offset, __private half *p); | ||
| 3266 | void __ovld vstorea_half16_rtn(float16 data, size_t offset, __private half *p); | ||
| 3267 | |||
| 3268 | -#ifdef cl_khr_fp64 | ||
| 3269 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3270 | void __ovld vstorea_half(double data, size_t offset, __global half *p); | ||
| 3271 | void __ovld vstorea_half2(double2 data, size_t offset, __global half *p); | ||
| 3272 | void __ovld vstorea_half3(double3 data, size_t offset, __global half *p); | ||
| 3273 | @@ -12495,8 +12501,7 @@ void __ovld vstorea_half3_rtn(double3 data,size_t offset, __private half *p); | ||
| 3274 | void __ovld vstorea_half4_rtn(double4 data,size_t offset, __private half *p); | ||
| 3275 | void __ovld vstorea_half8_rtn(double8 data,size_t offset, __private half *p); | ||
| 3276 | void __ovld vstorea_half16_rtn(double16 data,size_t offset, __private half *p); | ||
| 3277 | -#endif //cl_khr_fp64 | ||
| 3278 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3279 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3280 | |||
| 3281 | // OpenCL v1.1 s6.11.8, v1.2 s6.12.8, v2.0 s6.13.8 - Synchronization Functions | ||
| 3282 | |||
| 3283 | @@ -12580,7 +12585,7 @@ void __ovld write_mem_fence(cl_mem_fence_flags flags); | ||
| 3284 | |||
| 3285 | // OpenCL v2.0 s6.13.9 - Address Space Qualifier Functions | ||
| 3286 | |||
| 3287 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3288 | +#ifdef __opencl_c_generic_address_space | ||
| 3289 | cl_mem_fence_flags __ovld get_fence(const void *ptr); | ||
| 3290 | cl_mem_fence_flags __ovld get_fence(void *ptr); | ||
| 3291 | |||
| 3292 | @@ -12591,7 +12596,7 @@ cl_mem_fence_flags __ovld get_fence(void *ptr); | ||
| 3293 | * where gentype is builtin type or user defined type. | ||
| 3294 | */ | ||
| 3295 | |||
| 3296 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3297 | +#endif //__opencl_c_generic_address_space | ||
| 3298 | |||
| 3299 | // OpenCL v1.1 s6.11.10, v1.2 s6.12.10, v2.0 s6.13.10 - Async Copies from Global to Local Memory, Local to Global Memory, and Prefetch | ||
| 3300 | |||
| 3301 | @@ -12730,7 +12735,7 @@ event_t __ovld async_work_group_copy(__global uint16 *dst, const __local uint16 | ||
| 3302 | event_t __ovld async_work_group_copy(__global long16 *dst, const __local long16 *src, size_t num_elements, event_t event); | ||
| 3303 | event_t __ovld async_work_group_copy(__global ulong16 *dst, const __local ulong16 *src, size_t num_elements, event_t event); | ||
| 3304 | event_t __ovld async_work_group_copy(__global float16 *dst, const __local float16 *src, size_t num_elements, event_t event); | ||
| 3305 | -#ifdef cl_khr_fp64 | ||
| 3306 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3307 | event_t __ovld async_work_group_copy(__local double *dst, const __global double *src, size_t num_elements, event_t event); | ||
| 3308 | event_t __ovld async_work_group_copy(__local double2 *dst, const __global double2 *src, size_t num_elements, event_t event); | ||
| 3309 | event_t __ovld async_work_group_copy(__local double3 *dst, const __global double3 *src, size_t num_elements, event_t event); | ||
| 3310 | @@ -12743,7 +12748,7 @@ event_t __ovld async_work_group_copy(__global double3 *dst, const __local double | ||
| 3311 | event_t __ovld async_work_group_copy(__global double4 *dst, const __local double4 *src, size_t num_elements, event_t event); | ||
| 3312 | event_t __ovld async_work_group_copy(__global double8 *dst, const __local double8 *src, size_t num_elements, event_t event); | ||
| 3313 | event_t __ovld async_work_group_copy(__global double16 *dst, const __local double16 *src, size_t num_elements, event_t event); | ||
| 3314 | -#endif //cl_khr_fp64 | ||
| 3315 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3316 | #ifdef cl_khr_fp16 | ||
| 3317 | event_t __ovld async_work_group_copy(__local half *dst, const __global half *src, size_t num_elements, event_t event); | ||
| 3318 | event_t __ovld async_work_group_copy(__local half2 *dst, const __global half2 *src, size_t num_elements, event_t event); | ||
| 3319 | @@ -12893,7 +12898,7 @@ event_t __ovld async_work_group_strided_copy(__global uint16 *dst, const __local | ||
| 3320 | event_t __ovld async_work_group_strided_copy(__global long16 *dst, const __local long16 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3321 | event_t __ovld async_work_group_strided_copy(__global ulong16 *dst, const __local ulong16 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3322 | event_t __ovld async_work_group_strided_copy(__global float16 *dst, const __local float16 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3323 | -#ifdef cl_khr_fp64 | ||
| 3324 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3325 | event_t __ovld async_work_group_strided_copy(__local double *dst, const __global double *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3326 | event_t __ovld async_work_group_strided_copy(__local double2 *dst, const __global double2 *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3327 | event_t __ovld async_work_group_strided_copy(__local double3 *dst, const __global double3 *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3328 | @@ -12906,7 +12911,7 @@ event_t __ovld async_work_group_strided_copy(__global double3 *dst, const __loca | ||
| 3329 | event_t __ovld async_work_group_strided_copy(__global double4 *dst, const __local double4 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3330 | event_t __ovld async_work_group_strided_copy(__global double8 *dst, const __local double8 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3331 | event_t __ovld async_work_group_strided_copy(__global double16 *dst, const __local double16 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3332 | -#endif //cl_khr_fp64 | ||
| 3333 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3334 | #ifdef cl_khr_fp16 | ||
| 3335 | event_t __ovld async_work_group_strided_copy(__local half *dst, const __global half *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3336 | event_t __ovld async_work_group_strided_copy(__local half2 *dst, const __global half2 *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3337 | @@ -12996,14 +13001,14 @@ void __ovld prefetch(const __global uint16 *p, size_t num_elements); | ||
| 3338 | void __ovld prefetch(const __global long16 *p, size_t num_elements); | ||
| 3339 | void __ovld prefetch(const __global ulong16 *p, size_t num_elements); | ||
| 3340 | void __ovld prefetch(const __global float16 *p, size_t num_elements); | ||
| 3341 | -#ifdef cl_khr_fp64 | ||
| 3342 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3343 | void __ovld prefetch(const __global double *p, size_t num_elements); | ||
| 3344 | void __ovld prefetch(const __global double2 *p, size_t num_elements); | ||
| 3345 | void __ovld prefetch(const __global double3 *p, size_t num_elements); | ||
| 3346 | void __ovld prefetch(const __global double4 *p, size_t num_elements); | ||
| 3347 | void __ovld prefetch(const __global double8 *p, size_t num_elements); | ||
| 3348 | void __ovld prefetch(const __global double16 *p, size_t num_elements); | ||
| 3349 | -#endif //cl_khr_fp64 | ||
| 3350 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3351 | #ifdef cl_khr_fp16 | ||
| 3352 | void __ovld prefetch(const __global half *p, size_t num_elements); | ||
| 3353 | void __ovld prefetch(const __global half2 *p, size_t num_elements); | ||
| 3354 | @@ -13026,9 +13031,11 @@ void __ovld prefetch(const __global half16 *p, size_t num_elements); | ||
| 3355 | * pointed by p. The function returns old. | ||
| 3356 | */ | ||
| 3357 | int __ovld atomic_add(volatile __global int *p, int val); | ||
| 3358 | -unsigned int __ovld atomic_add(volatile __global unsigned int *p, unsigned int val); | ||
| 3359 | +unsigned int __ovld atomic_add(volatile __global unsigned int *p, | ||
| 3360 | + unsigned int val); | ||
| 3361 | int __ovld atomic_add(volatile __local int *p, int val); | ||
| 3362 | -unsigned int __ovld atomic_add(volatile __local unsigned int *p, unsigned int val); | ||
| 3363 | +unsigned int __ovld atomic_add(volatile __local unsigned int *p, | ||
| 3364 | + unsigned int val); | ||
| 3365 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3366 | int __ovld atomic_add(volatile int *p, int val); | ||
| 3367 | unsigned int __ovld atomic_add(volatile unsigned int *p, unsigned int val); | ||
| 3368 | @@ -13056,9 +13063,11 @@ unsigned long __ovld atom_add(volatile __local unsigned long *p, unsigned long v | ||
| 3369 | * returns old. | ||
| 3370 | */ | ||
| 3371 | int __ovld atomic_sub(volatile __global int *p, int val); | ||
| 3372 | -unsigned int __ovld atomic_sub(volatile __global unsigned int *p, unsigned int val); | ||
| 3373 | +unsigned int __ovld atomic_sub(volatile __global unsigned int *p, | ||
| 3374 | + unsigned int val); | ||
| 3375 | int __ovld atomic_sub(volatile __local int *p, int val); | ||
| 3376 | -unsigned int __ovld atomic_sub(volatile __local unsigned int *p, unsigned int val); | ||
| 3377 | +unsigned int __ovld atomic_sub(volatile __local unsigned int *p, | ||
| 3378 | + unsigned int val); | ||
| 3379 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3380 | int __ovld atomic_sub(volatile int *p, int val); | ||
| 3381 | unsigned int __ovld atomic_sub(volatile unsigned int *p, unsigned int val); | ||
| 3382 | @@ -13086,9 +13095,11 @@ unsigned long __ovld atom_sub(volatile __local unsigned long *p, unsigned long v | ||
| 3383 | * value. | ||
| 3384 | */ | ||
| 3385 | int __ovld atomic_xchg(volatile __global int *p, int val); | ||
| 3386 | -unsigned int __ovld atomic_xchg(volatile __global unsigned int *p, unsigned int val); | ||
| 3387 | +unsigned int __ovld atomic_xchg(volatile __global unsigned int *p, | ||
| 3388 | + unsigned int val); | ||
| 3389 | int __ovld atomic_xchg(volatile __local int *p, int val); | ||
| 3390 | -unsigned int __ovld atomic_xchg(volatile __local unsigned int *p, unsigned int val); | ||
| 3391 | +unsigned int __ovld atomic_xchg(volatile __local unsigned int *p, | ||
| 3392 | + unsigned int val); | ||
| 3393 | float __ovld atomic_xchg(volatile __global float *p, float val); | ||
| 3394 | float __ovld atomic_xchg(volatile __local float *p, float val); | ||
| 3395 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3396 | @@ -13183,12 +13194,15 @@ unsigned long __ovld atom_dec(volatile __local unsigned long *p); | ||
| 3397 | * returns old. | ||
| 3398 | */ | ||
| 3399 | int __ovld atomic_cmpxchg(volatile __global int *p, int cmp, int val); | ||
| 3400 | -unsigned int __ovld atomic_cmpxchg(volatile __global unsigned int *p, unsigned int cmp, unsigned int val); | ||
| 3401 | +unsigned int __ovld atomic_cmpxchg(volatile __global unsigned int *p, | ||
| 3402 | + unsigned int cmp, unsigned int val); | ||
| 3403 | int __ovld atomic_cmpxchg(volatile __local int *p, int cmp, int val); | ||
| 3404 | -unsigned int __ovld atomic_cmpxchg(volatile __local unsigned int *p, unsigned int cmp, unsigned int val); | ||
| 3405 | +unsigned int __ovld atomic_cmpxchg(volatile __local unsigned int *p, | ||
| 3406 | + unsigned int cmp, unsigned int val); | ||
| 3407 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3408 | int __ovld atomic_cmpxchg(volatile int *p, int cmp, int val); | ||
| 3409 | -unsigned int __ovld atomic_cmpxchg(volatile unsigned int *p, unsigned int cmp, unsigned int val); | ||
| 3410 | +unsigned int __ovld atomic_cmpxchg(volatile unsigned int *p, unsigned int cmp, | ||
| 3411 | + unsigned int val); | ||
| 3412 | #endif | ||
| 3413 | |||
| 3414 | #if defined(cl_khr_global_int32_base_atomics) | ||
| 3415 | @@ -13215,9 +13229,11 @@ unsigned long __ovld atom_cmpxchg(volatile __local unsigned long *p, unsigned lo | ||
| 3416 | * returns old. | ||
| 3417 | */ | ||
| 3418 | int __ovld atomic_min(volatile __global int *p, int val); | ||
| 3419 | -unsigned int __ovld atomic_min(volatile __global unsigned int *p, unsigned int val); | ||
| 3420 | +unsigned int __ovld atomic_min(volatile __global unsigned int *p, | ||
| 3421 | + unsigned int val); | ||
| 3422 | int __ovld atomic_min(volatile __local int *p, int val); | ||
| 3423 | -unsigned int __ovld atomic_min(volatile __local unsigned int *p, unsigned int val); | ||
| 3424 | +unsigned int __ovld atomic_min(volatile __local unsigned int *p, | ||
| 3425 | + unsigned int val); | ||
| 3426 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3427 | int __ovld atomic_min(volatile int *p, int val); | ||
| 3428 | unsigned int __ovld atomic_min(volatile unsigned int *p, unsigned int val); | ||
| 3429 | @@ -13247,9 +13263,11 @@ unsigned long __ovld atom_min(volatile __local unsigned long *p, unsigned long v | ||
| 3430 | * returns old. | ||
| 3431 | */ | ||
| 3432 | int __ovld atomic_max(volatile __global int *p, int val); | ||
| 3433 | -unsigned int __ovld atomic_max(volatile __global unsigned int *p, unsigned int val); | ||
| 3434 | +unsigned int __ovld atomic_max(volatile __global unsigned int *p, | ||
| 3435 | + unsigned int val); | ||
| 3436 | int __ovld atomic_max(volatile __local int *p, int val); | ||
| 3437 | -unsigned int __ovld atomic_max(volatile __local unsigned int *p, unsigned int val); | ||
| 3438 | +unsigned int __ovld atomic_max(volatile __local unsigned int *p, | ||
| 3439 | + unsigned int val); | ||
| 3440 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3441 | int __ovld atomic_max(volatile int *p, int val); | ||
| 3442 | unsigned int __ovld atomic_max(volatile unsigned int *p, unsigned int val); | ||
| 3443 | @@ -13278,9 +13296,11 @@ unsigned long __ovld atom_max(volatile __local unsigned long *p, unsigned long v | ||
| 3444 | * pointed by p. The function returns old. | ||
| 3445 | */ | ||
| 3446 | int __ovld atomic_and(volatile __global int *p, int val); | ||
| 3447 | -unsigned int __ovld atomic_and(volatile __global unsigned int *p, unsigned int val); | ||
| 3448 | +unsigned int __ovld atomic_and(volatile __global unsigned int *p, | ||
| 3449 | + unsigned int val); | ||
| 3450 | int __ovld atomic_and(volatile __local int *p, int val); | ||
| 3451 | -unsigned int __ovld atomic_and(volatile __local unsigned int *p, unsigned int val); | ||
| 3452 | +unsigned int __ovld atomic_and(volatile __local unsigned int *p, | ||
| 3453 | + unsigned int val); | ||
| 3454 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3455 | int __ovld atomic_and(volatile int *p, int val); | ||
| 3456 | unsigned int __ovld atomic_and(volatile unsigned int *p, unsigned int val); | ||
| 3457 | @@ -13309,9 +13329,11 @@ unsigned long __ovld atom_and(volatile __local unsigned long *p, unsigned long v | ||
| 3458 | * pointed by p. The function returns old. | ||
| 3459 | */ | ||
| 3460 | int __ovld atomic_or(volatile __global int *p, int val); | ||
| 3461 | -unsigned int __ovld atomic_or(volatile __global unsigned int *p, unsigned int val); | ||
| 3462 | +unsigned int __ovld atomic_or(volatile __global unsigned int *p, | ||
| 3463 | + unsigned int val); | ||
| 3464 | int __ovld atomic_or(volatile __local int *p, int val); | ||
| 3465 | -unsigned int __ovld atomic_or(volatile __local unsigned int *p, unsigned int val); | ||
| 3466 | +unsigned int __ovld atomic_or(volatile __local unsigned int *p, | ||
| 3467 | + unsigned int val); | ||
| 3468 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3469 | int __ovld atomic_or(volatile int *p, int val); | ||
| 3470 | unsigned int __ovld atomic_or(volatile unsigned int *p, unsigned int val); | ||
| 3471 | @@ -13340,9 +13362,11 @@ unsigned long __ovld atom_or(volatile __local unsigned long *p, unsigned long va | ||
| 3472 | * pointed by p. The function returns old. | ||
| 3473 | */ | ||
| 3474 | int __ovld atomic_xor(volatile __global int *p, int val); | ||
| 3475 | -unsigned int __ovld atomic_xor(volatile __global unsigned int *p, unsigned int val); | ||
| 3476 | +unsigned int __ovld atomic_xor(volatile __global unsigned int *p, | ||
| 3477 | + unsigned int val); | ||
| 3478 | int __ovld atomic_xor(volatile __local int *p, int val); | ||
| 3479 | -unsigned int __ovld atomic_xor(volatile __local unsigned int *p, unsigned int val); | ||
| 3480 | +unsigned int __ovld atomic_xor(volatile __local unsigned int *p, | ||
| 3481 | + unsigned int val); | ||
| 3482 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3483 | int __ovld atomic_xor(volatile int *p, int val); | ||
| 3484 | unsigned int __ovld atomic_xor(volatile unsigned int *p, unsigned int val); | ||
| 3485 | @@ -13380,120 +13404,78 @@ unsigned long __ovld atom_xor(volatile __local unsigned long *p, unsigned long v | ||
| 3486 | #endif | ||
| 3487 | |||
| 3488 | // atomic_init() | ||
| 3489 | +#ifdef __opencl_c_generic_address_space | ||
| 3490 | void __ovld atomic_init(volatile atomic_int *object, int value); | ||
| 3491 | void __ovld atomic_init(volatile atomic_uint *object, uint value); | ||
| 3492 | void __ovld atomic_init(volatile atomic_float *object, float value); | ||
| 3493 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3494 | void __ovld atomic_init(volatile atomic_long *object, long value); | ||
| 3495 | void __ovld atomic_init(volatile atomic_ulong *object, ulong value); | ||
| 3496 | -#ifdef cl_khr_fp64 | ||
| 3497 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3498 | void __ovld atomic_init(volatile atomic_double *object, double value); | ||
| 3499 | -#endif //cl_khr_fp64 | ||
| 3500 | -#endif | ||
| 3501 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3502 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3503 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3504 | +#endif // __opencl_c_generic_address_space | ||
| 3505 | + | ||
| 3506 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 3507 | +void __ovld atomic_init(volatile atomic_int __global *object, int value); | ||
| 3508 | +void __ovld atomic_init(volatile atomic_int __local *object, int value); | ||
| 3509 | +void __ovld atomic_init(volatile atomic_uint __global *object, uint value); | ||
| 3510 | +void __ovld atomic_init(volatile atomic_uint __local *object, uint value); | ||
| 3511 | +void __ovld atomic_init(volatile atomic_float __global *object, float value); | ||
| 3512 | +void __ovld atomic_init(volatile atomic_float __local *object, float value); | ||
| 3513 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3514 | +void __ovld atomic_init(volatile atomic_long __global *object, long value); | ||
| 3515 | +void __ovld atomic_init(volatile atomic_long __local *object, long value); | ||
| 3516 | +void __ovld atomic_init(volatile atomic_ulong __global *object, ulong value); | ||
| 3517 | +void __ovld atomic_init(volatile atomic_ulong __local *object, ulong value); | ||
| 3518 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3519 | +void __ovld atomic_init(volatile atomic_double __global *object, double value); | ||
| 3520 | +void __ovld atomic_init(volatile atomic_double __local *object, double value); | ||
| 3521 | +#endif // cl_khr_fp64 | ||
| 3522 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3523 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3524 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 3525 | |||
| 3526 | // atomic_work_item_fence() | ||
| 3527 | -void __ovld atomic_work_item_fence(cl_mem_fence_flags flags, memory_order order, memory_scope scope); | ||
| 3528 | +void __ovld atomic_work_item_fence(cl_mem_fence_flags flags, memory_order order, | ||
| 3529 | + memory_scope scope); | ||
| 3530 | |||
| 3531 | // atomic_fetch() | ||
| 3532 | - | ||
| 3533 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 3534 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 3535 | +#ifdef __opencl_c_generic_address_space | ||
| 3536 | int __ovld atomic_fetch_add(volatile atomic_int *object, int operand); | ||
| 3537 | -int __ovld atomic_fetch_add_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3538 | -int __ovld atomic_fetch_add_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3539 | uint __ovld atomic_fetch_add(volatile atomic_uint *object, uint operand); | ||
| 3540 | -uint __ovld atomic_fetch_add_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3541 | -uint __ovld atomic_fetch_add_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3542 | int __ovld atomic_fetch_sub(volatile atomic_int *object, int operand); | ||
| 3543 | -int __ovld atomic_fetch_sub_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3544 | -int __ovld atomic_fetch_sub_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3545 | uint __ovld atomic_fetch_sub(volatile atomic_uint *object, uint operand); | ||
| 3546 | -uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3547 | -uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3548 | int __ovld atomic_fetch_or(volatile atomic_int *object, int operand); | ||
| 3549 | -int __ovld atomic_fetch_or_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3550 | -int __ovld atomic_fetch_or_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3551 | uint __ovld atomic_fetch_or(volatile atomic_uint *object, uint operand); | ||
| 3552 | -uint __ovld atomic_fetch_or_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3553 | -uint __ovld atomic_fetch_or_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3554 | int __ovld atomic_fetch_xor(volatile atomic_int *object, int operand); | ||
| 3555 | -int __ovld atomic_fetch_xor_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3556 | -int __ovld atomic_fetch_xor_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3557 | uint __ovld atomic_fetch_xor(volatile atomic_uint *object, uint operand); | ||
| 3558 | -uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3559 | -uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3560 | int __ovld atomic_fetch_and(volatile atomic_int *object, int operand); | ||
| 3561 | -int __ovld atomic_fetch_and_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3562 | -int __ovld atomic_fetch_and_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3563 | uint __ovld atomic_fetch_and(volatile atomic_uint *object, uint operand); | ||
| 3564 | -uint __ovld atomic_fetch_and_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3565 | -uint __ovld atomic_fetch_and_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3566 | int __ovld atomic_fetch_min(volatile atomic_int *object, int operand); | ||
| 3567 | -int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3568 | -int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3569 | uint __ovld atomic_fetch_min(volatile atomic_uint *object, uint operand); | ||
| 3570 | -uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3571 | -uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3572 | -uint __ovld atomic_fetch_min(volatile atomic_uint *object, int operand); | ||
| 3573 | -uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, int operand, memory_order order); | ||
| 3574 | -uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, int operand, memory_order order, memory_scope scope); | ||
| 3575 | int __ovld atomic_fetch_max(volatile atomic_int *object, int operand); | ||
| 3576 | -int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3577 | -int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3578 | uint __ovld atomic_fetch_max(volatile atomic_uint *object, uint operand); | ||
| 3579 | -uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3580 | -uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3581 | -uint __ovld atomic_fetch_max(volatile atomic_uint *object, int operand); | ||
| 3582 | -uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, int operand, memory_order order); | ||
| 3583 | -uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, int operand, memory_order order, memory_scope scope); | ||
| 3584 | |||
| 3585 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3586 | long __ovld atomic_fetch_add(volatile atomic_long *object, long operand); | ||
| 3587 | -long __ovld atomic_fetch_add_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3588 | -long __ovld atomic_fetch_add_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3589 | ulong __ovld atomic_fetch_add(volatile atomic_ulong *object, ulong operand); | ||
| 3590 | -ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3591 | -ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3592 | long __ovld atomic_fetch_sub(volatile atomic_long *object, long operand); | ||
| 3593 | -long __ovld atomic_fetch_sub_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3594 | -long __ovld atomic_fetch_sub_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3595 | ulong __ovld atomic_fetch_sub(volatile atomic_ulong *object, ulong operand); | ||
| 3596 | -ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3597 | -ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3598 | long __ovld atomic_fetch_or(volatile atomic_long *object, long operand); | ||
| 3599 | -long __ovld atomic_fetch_or_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3600 | -long __ovld atomic_fetch_or_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3601 | ulong __ovld atomic_fetch_or(volatile atomic_ulong *object, ulong operand); | ||
| 3602 | -ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3603 | -ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3604 | long __ovld atomic_fetch_xor(volatile atomic_long *object, long operand); | ||
| 3605 | -long __ovld atomic_fetch_xor_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3606 | -long __ovld atomic_fetch_xor_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3607 | ulong __ovld atomic_fetch_xor(volatile atomic_ulong *object, ulong operand); | ||
| 3608 | -ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3609 | -ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3610 | long __ovld atomic_fetch_and(volatile atomic_long *object, long operand); | ||
| 3611 | -long __ovld atomic_fetch_and_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3612 | -long __ovld atomic_fetch_and_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3613 | ulong __ovld atomic_fetch_and(volatile atomic_ulong *object, ulong operand); | ||
| 3614 | -ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3615 | -ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3616 | long __ovld atomic_fetch_min(volatile atomic_long *object, long operand); | ||
| 3617 | -long __ovld atomic_fetch_min_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3618 | -long __ovld atomic_fetch_min_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3619 | ulong __ovld atomic_fetch_min(volatile atomic_ulong *object, ulong operand); | ||
| 3620 | -ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3621 | -ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3622 | -ulong __ovld atomic_fetch_min(volatile atomic_ulong *object, long operand); | ||
| 3623 | -ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, long operand, memory_order order); | ||
| 3624 | -ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, long operand, memory_order order, memory_scope scope); | ||
| 3625 | long __ovld atomic_fetch_max(volatile atomic_long *object, long operand); | ||
| 3626 | -long __ovld atomic_fetch_max_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3627 | -long __ovld atomic_fetch_max_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3628 | ulong __ovld atomic_fetch_max(volatile atomic_ulong *object, ulong operand); | ||
| 3629 | -ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3630 | -ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3631 | -ulong __ovld atomic_fetch_max(volatile atomic_ulong *object, long operand); | ||
| 3632 | -ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, long operand, memory_order order); | ||
| 3633 | -ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, long operand, memory_order order, memory_scope scope); | ||
| 3634 | #endif //defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3635 | |||
| 3636 | // OpenCL v2.0 s6.13.11.7.5: | ||
| 3637 | @@ -13501,196 +13483,2239 @@ ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, long opera | ||
| 3638 | // or/xor/and/min/max: atomic type argument can be intptr_t/uintptr_t, value type argument can be intptr_t/uintptr_t. | ||
| 3639 | |||
| 3640 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3641 | -uintptr_t __ovld atomic_fetch_add(volatile atomic_uintptr_t *object, ptrdiff_t operand); | ||
| 3642 | -uintptr_t __ovld atomic_fetch_add_explicit(volatile atomic_uintptr_t *object, ptrdiff_t operand, memory_order order); | ||
| 3643 | -uintptr_t __ovld atomic_fetch_add_explicit(volatile atomic_uintptr_t *object, ptrdiff_t operand, memory_order order, memory_scope scope); | ||
| 3644 | -uintptr_t __ovld atomic_fetch_sub(volatile atomic_uintptr_t *object, ptrdiff_t operand); | ||
| 3645 | -uintptr_t __ovld atomic_fetch_sub_explicit(volatile atomic_uintptr_t *object, ptrdiff_t operand, memory_order order); | ||
| 3646 | -uintptr_t __ovld atomic_fetch_sub_explicit(volatile atomic_uintptr_t *object, ptrdiff_t operand, memory_order order, memory_scope scope); | ||
| 3647 | - | ||
| 3648 | -uintptr_t __ovld atomic_fetch_or(volatile atomic_uintptr_t *object, intptr_t operand); | ||
| 3649 | -uintptr_t __ovld atomic_fetch_or_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order); | ||
| 3650 | -uintptr_t __ovld atomic_fetch_or_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order, memory_scope scope); | ||
| 3651 | -uintptr_t __ovld atomic_fetch_xor(volatile atomic_uintptr_t *object, intptr_t operand); | ||
| 3652 | -uintptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order); | ||
| 3653 | -uintptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order, memory_scope scope); | ||
| 3654 | -uintptr_t __ovld atomic_fetch_and(volatile atomic_uintptr_t *object, intptr_t operand); | ||
| 3655 | -uintptr_t __ovld atomic_fetch_and_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order); | ||
| 3656 | -uintptr_t __ovld atomic_fetch_and_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order, memory_scope scope); | ||
| 3657 | -uintptr_t __ovld atomic_fetch_min(volatile atomic_uintptr_t *object, intptr_t opermax); | ||
| 3658 | -uintptr_t __ovld atomic_fetch_min_explicit(volatile atomic_uintptr_t *object, intptr_t opermax, memory_order minder); | ||
| 3659 | -uintptr_t __ovld atomic_fetch_min_explicit(volatile atomic_uintptr_t *object, intptr_t opermax, memory_order minder, memory_scope scope); | ||
| 3660 | -uintptr_t __ovld atomic_fetch_max(volatile atomic_uintptr_t *object, intptr_t opermax); | ||
| 3661 | -uintptr_t __ovld atomic_fetch_max_explicit(volatile atomic_uintptr_t *object, intptr_t opermax, memory_order minder); | ||
| 3662 | -uintptr_t __ovld atomic_fetch_max_explicit(volatile atomic_uintptr_t *object, intptr_t opermax, memory_order minder, memory_scope scope); | ||
| 3663 | - | ||
| 3664 | -intptr_t __ovld atomic_fetch_or(volatile atomic_intptr_t *object, uintptr_t operand); | ||
| 3665 | -intptr_t __ovld atomic_fetch_or_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order); | ||
| 3666 | -intptr_t __ovld atomic_fetch_or_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order, memory_scope scope); | ||
| 3667 | -intptr_t __ovld atomic_fetch_xor(volatile atomic_intptr_t *object, uintptr_t operand); | ||
| 3668 | -intptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order); | ||
| 3669 | -intptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order, memory_scope scope); | ||
| 3670 | -intptr_t __ovld atomic_fetch_and(volatile atomic_intptr_t *object, uintptr_t operand); | ||
| 3671 | -intptr_t __ovld atomic_fetch_and_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order); | ||
| 3672 | -intptr_t __ovld atomic_fetch_and_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order, memory_scope scope); | ||
| 3673 | -intptr_t __ovld atomic_fetch_min(volatile atomic_intptr_t *object, uintptr_t opermax); | ||
| 3674 | -intptr_t __ovld atomic_fetch_min_explicit(volatile atomic_intptr_t *object, uintptr_t opermax, memory_order minder); | ||
| 3675 | -intptr_t __ovld atomic_fetch_min_explicit(volatile atomic_intptr_t *object, uintptr_t opermax, memory_order minder, memory_scope scope); | ||
| 3676 | -intptr_t __ovld atomic_fetch_max(volatile atomic_intptr_t *object, uintptr_t opermax); | ||
| 3677 | -intptr_t __ovld atomic_fetch_max_explicit(volatile atomic_intptr_t *object, uintptr_t opermax, memory_order minder); | ||
| 3678 | -intptr_t __ovld atomic_fetch_max_explicit(volatile atomic_intptr_t *object, uintptr_t opermax, memory_order minder, memory_scope scope); | ||
| 3679 | +uintptr_t __ovld atomic_fetch_add(volatile atomic_uintptr_t *object, | ||
| 3680 | + ptrdiff_t operand); | ||
| 3681 | +uintptr_t __ovld atomic_fetch_sub(volatile atomic_uintptr_t *object, | ||
| 3682 | + ptrdiff_t operand); | ||
| 3683 | + | ||
| 3684 | +uintptr_t __ovld atomic_fetch_or(volatile atomic_uintptr_t *object, | ||
| 3685 | + intptr_t operand); | ||
| 3686 | +uintptr_t __ovld atomic_fetch_xor(volatile atomic_uintptr_t *object, | ||
| 3687 | + intptr_t operand); | ||
| 3688 | +uintptr_t __ovld atomic_fetch_and(volatile atomic_uintptr_t *object, | ||
| 3689 | + intptr_t operand); | ||
| 3690 | +uintptr_t __ovld atomic_fetch_min(volatile atomic_uintptr_t *object, | ||
| 3691 | + intptr_t opermax); | ||
| 3692 | +uintptr_t __ovld atomic_fetch_max(volatile atomic_uintptr_t *object, | ||
| 3693 | + intptr_t opermax); | ||
| 3694 | + | ||
| 3695 | +intptr_t __ovld atomic_fetch_or(volatile atomic_intptr_t *object, | ||
| 3696 | + uintptr_t operand); | ||
| 3697 | +intptr_t __ovld atomic_fetch_xor(volatile atomic_intptr_t *object, | ||
| 3698 | + uintptr_t operand); | ||
| 3699 | +intptr_t __ovld atomic_fetch_and(volatile atomic_intptr_t *object, | ||
| 3700 | + uintptr_t operand); | ||
| 3701 | +intptr_t __ovld atomic_fetch_min(volatile atomic_intptr_t *object, | ||
| 3702 | + uintptr_t opermax); | ||
| 3703 | +intptr_t __ovld atomic_fetch_max(volatile atomic_intptr_t *object, | ||
| 3704 | + uintptr_t opermax); | ||
| 3705 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3706 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3707 | +#endif // __opencl_c_generic_address_space | ||
| 3708 | + | ||
| 3709 | +#if(__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 3710 | +int __ovld atomic_fetch_add(volatile atomic_int __global *object, int operand); | ||
| 3711 | +uint __ovld atomic_fetch_add(volatile atomic_uint __local *object, | ||
| 3712 | + uint operand); | ||
| 3713 | +int __ovld atomic_fetch_sub(volatile atomic_int __global *object, int operand); | ||
| 3714 | +int __ovld atomic_fetch_sub(volatile atomic_int __local *object, int operand); | ||
| 3715 | +uint __ovld atomic_fetch_sub(volatile atomic_uint __local *object, | ||
| 3716 | + uint operand); | ||
| 3717 | +uint __ovld atomic_fetch_sub(volatile atomic_uint __global *object, | ||
| 3718 | + uint operand); | ||
| 3719 | +int __ovld atomic_fetch_or(volatile atomic_int __global *object, int operand); | ||
| 3720 | +uint __ovld atomic_fetch_sub(volatile atomic_uint __local *object, | ||
| 3721 | + uint operand); | ||
| 3722 | +uint __ovld atomic_fetch_or(volatile atomic_uint __global *object, | ||
| 3723 | + uint operand); | ||
| 3724 | +uint __ovld atomic_fetch_or(volatile atomic_uint __local *object, uint operand); | ||
| 3725 | +int __ovld atomic_fetch_xor(volatile atomic_int __global *object, int operand); | ||
| 3726 | +int __ovld atomic_fetch_xor(volatile atomic_int __local *object, int operand); | ||
| 3727 | +uint __ovld atomic_fetch_xor(volatile atomic_uint __global *object, | ||
| 3728 | + uint operand); | ||
| 3729 | +uint __ovld atomic_fetch_xor(volatile atomic_uint __local *object, | ||
| 3730 | + uint operand); | ||
| 3731 | +int __ovld atomic_fetch_and(volatile atomic_int __global *object, int operand); | ||
| 3732 | +int __ovld atomic_fetch_and(volatile atomic_int __local *object, int operand); | ||
| 3733 | +uint __ovld atomic_fetch_and(volatile atomic_uint __global *object, | ||
| 3734 | + uint operand); | ||
| 3735 | +uint __ovld atomic_fetch_and(volatile atomic_uint __local *object, | ||
| 3736 | + uint operand); | ||
| 3737 | +int __ovld atomic_fetch_min(volatile atomic_int __global *object, int operand); | ||
| 3738 | +int __ovld atomic_fetch_min(volatile atomic_int __local *object, int operand); | ||
| 3739 | +uint __ovld atomic_fetch_min(volatile atomic_uint __global *object, | ||
| 3740 | + uint operand); | ||
| 3741 | +uint __ovld atomic_fetch_min(volatile atomic_uint __local *object, | ||
| 3742 | + uint operand); | ||
| 3743 | +int __ovld atomic_fetch_max(volatile atomic_int __global *object, int operand); | ||
| 3744 | +int __ovld atomic_fetch_max(volatile atomic_int __local *object, int operand); | ||
| 3745 | +uint __ovld atomic_fetch_max(volatile atomic_uint __global *object, | ||
| 3746 | + uint operand); | ||
| 3747 | +uint __ovld atomic_fetch_max(volatile atomic_uint __local *object, | ||
| 3748 | + uint operand); | ||
| 3749 | + | ||
| 3750 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3751 | +long __ovld atomic_fetch_add(volatile atomic_long __global *object, | ||
| 3752 | + long operand); | ||
| 3753 | +long __ovld atomic_fetch_add(volatile atomic_long __local *object, | ||
| 3754 | + long operand); | ||
| 3755 | +ulong __ovld atomic_fetch_add(volatile atomic_ulong __global *object, | ||
| 3756 | + ulong operand); | ||
| 3757 | +ulong __ovld atomic_fetch_add(volatile atomic_ulong __local *object, | ||
| 3758 | + ulong operand); | ||
| 3759 | +long __ovld atomic_fetch_sub(volatile atomic_long __global *object, | ||
| 3760 | + long operand); | ||
| 3761 | +long __ovld atomic_fetch_sub(volatile atomic_long __local *object, | ||
| 3762 | + long operand); | ||
| 3763 | +ulong __ovld atomic_fetch_sub(volatile atomic_ulong __global *object, | ||
| 3764 | + ulong operand); | ||
| 3765 | +ulong __ovld atomic_fetch_sub(volatile atomic_ulong __local *object, | ||
| 3766 | + ulong operand); | ||
| 3767 | +long __ovld atomic_fetch_or(volatile atomic_long __global *object, | ||
| 3768 | + long operand); | ||
| 3769 | +long __ovld atomic_fetch_or(volatile atomic_long __local *object, long operand); | ||
| 3770 | +ulong __ovld atomic_fetch_or(volatile atomic_ulong __global *object, | ||
| 3771 | + ulong operand); | ||
| 3772 | +ulong __ovld atomic_fetch_or(volatile atomic_ulong __local *object, | ||
| 3773 | + ulong operand); | ||
| 3774 | +long __ovld atomic_fetch_xor(volatile atomic_long __global *object, | ||
| 3775 | + long operand); | ||
| 3776 | +long __ovld atomic_fetch_xor(volatile atomic_long __local *object, | ||
| 3777 | + long operand); | ||
| 3778 | +ulong __ovld atomic_fetch_xor(volatile atomic_ulong __global *object, | ||
| 3779 | + ulong operand); | ||
| 3780 | +ulong __ovld atomic_fetch_xor(volatile atomic_ulong __local *object, | ||
| 3781 | + ulong operand); | ||
| 3782 | +long __ovld atomic_fetch_and(volatile atomic_long __global *object, | ||
| 3783 | + long operand); | ||
| 3784 | +long __ovld atomic_fetch_and(volatile atomic_long __local *object, | ||
| 3785 | + long operand); | ||
| 3786 | +ulong __ovld atomic_fetch_and(volatile atomic_ulong __global *object, | ||
| 3787 | + ulong operand); | ||
| 3788 | +ulong __ovld atomic_fetch_and(volatile atomic_ulong __local *object, | ||
| 3789 | + ulong operand); | ||
| 3790 | +long __ovld atomic_fetch_min(volatile atomic_long __global *object, | ||
| 3791 | + long operand); | ||
| 3792 | +long __ovld atomic_fetch_min(volatile atomic_long __local *object, | ||
| 3793 | + long operand); | ||
| 3794 | +ulong __ovld atomic_fetch_min(volatile atomic_ulong __global *object, | ||
| 3795 | + ulong operand); | ||
| 3796 | +ulong __ovld atomic_fetch_min(volatile atomic_ulong __local *object, | ||
| 3797 | + ulong operand); | ||
| 3798 | +long __ovld atomic_fetch_max(volatile atomic_long __global *object, | ||
| 3799 | + long operand); | ||
| 3800 | +long __ovld atomic_fetch_max(volatile atomic_long __local *object, | ||
| 3801 | + long operand); | ||
| 3802 | +ulong __ovld atomic_fetch_max(volatile atomic_ulong __global *object, | ||
| 3803 | + ulong operand); | ||
| 3804 | +ulong __ovld atomic_fetch_max(volatile atomic_ulong __local *object, | ||
| 3805 | + ulong operand); | ||
| 3806 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3807 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3808 | + | ||
| 3809 | +// OpenCL v2.0 s6.13.11.7.5: | ||
| 3810 | +// add/sub: atomic type argument can be uintptr_t/intptr_t, value type argument | ||
| 3811 | +// can be ptrdiff_t. or/xor/and/min/max: atomic type argument can be | ||
| 3812 | +// intptr_t/uintptr_t, value type argument can be intptr_t/uintptr_t. | ||
| 3813 | + | ||
| 3814 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3815 | +uintptr_t __ovld atomic_fetch_add(volatile atomic_uintptr_t __global *object, | ||
| 3816 | + ptrdiff_t operand); | ||
| 3817 | +uintptr_t __ovld atomic_fetch_add(volatile atomic_uintptr_t __local *object, | ||
| 3818 | + ptrdiff_t operand); | ||
| 3819 | +uintptr_t __ovld atomic_fetch_sub(volatile atomic_uintptr_t __global *object, | ||
| 3820 | + ptrdiff_t operand); | ||
| 3821 | +uintptr_t __ovld atomic_fetch_sub(volatile atomic_uintptr_t __local *object, | ||
| 3822 | + ptrdiff_t operand); | ||
| 3823 | + | ||
| 3824 | +uintptr_t __ovld atomic_fetch_or(volatile atomic_uintptr_t __global *object, | ||
| 3825 | + intptr_t operand); | ||
| 3826 | +uintptr_t __ovld atomic_fetch_or(volatile atomic_uintptr_t __local *object, | ||
| 3827 | + intptr_t operand); | ||
| 3828 | +uintptr_t __ovld atomic_fetch_xor(volatile atomic_uintptr_t __global *object, | ||
| 3829 | + intptr_t operand); | ||
| 3830 | +uintptr_t __ovld atomic_fetch_xor(volatile atomic_uintptr_t __local *object, | ||
| 3831 | + intptr_t operand); | ||
| 3832 | +uintptr_t __ovld atomic_fetch_and(volatile atomic_uintptr_t __global *object, | ||
| 3833 | + intptr_t operand); | ||
| 3834 | +uintptr_t __ovld atomic_fetch_and(volatile atomic_uintptr_t __local *object, | ||
| 3835 | + intptr_t operand); | ||
| 3836 | +uintptr_t __ovld atomic_fetch_min(volatile atomic_uintptr_t __global *object, | ||
| 3837 | + intptr_t opermax); | ||
| 3838 | +uintptr_t __ovld atomic_fetch_min(volatile atomic_uintptr_t __local *object, | ||
| 3839 | + intptr_t opermax); | ||
| 3840 | +uintptr_t __ovld atomic_fetch_max(volatile atomic_uintptr_t __global *object, | ||
| 3841 | + intptr_t opermax); | ||
| 3842 | +uintptr_t __ovld atomic_fetch_max(volatile atomic_uintptr_t __local *object, | ||
| 3843 | + intptr_t opermax); | ||
| 3844 | + | ||
| 3845 | +intptr_t __ovld atomic_fetch_or(volatile atomic_intptr_t __global *object, | ||
| 3846 | + uintptr_t operand); | ||
| 3847 | +intptr_t __ovld atomic_fetch_or(volatile atomic_intptr_t __local *object, | ||
| 3848 | + uintptr_t operand); | ||
| 3849 | +intptr_t __ovld atomic_fetch_xor(volatile atomic_intptr_t __global *object, | ||
| 3850 | + uintptr_t operand); | ||
| 3851 | +intptr_t __ovld atomic_fetch_xor(volatile atomic_intptr_t __local *object, | ||
| 3852 | + uintptr_t operand); | ||
| 3853 | +intptr_t __ovld atomic_fetch_and(volatile atomic_intptr_t __global *object, | ||
| 3854 | + uintptr_t operand); | ||
| 3855 | +intptr_t __ovld atomic_fetch_and(volatile atomic_intptr_t __local *object, | ||
| 3856 | + uintptr_t operand); | ||
| 3857 | +intptr_t __ovld atomic_fetch_min(volatile atomic_intptr_t __global *object, | ||
| 3858 | + uintptr_t opermax); | ||
| 3859 | +intptr_t __ovld atomic_fetch_min(volatile atomic_intptr_t __local *object, | ||
| 3860 | + uintptr_t opermax); | ||
| 3861 | +intptr_t __ovld atomic_fetch_max(volatile atomic_intptr_t __global *object, | ||
| 3862 | + uintptr_t opermax); | ||
| 3863 | +intptr_t __ovld atomic_fetch_max(volatile atomic_intptr_t __local *object, | ||
| 3864 | + uintptr_t opermax); | ||
| 3865 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3866 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3867 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 3868 | + | ||
| 3869 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 3870 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 3871 | + | ||
| 3872 | +#ifdef __opencl_c_generic_address_space | ||
| 3873 | +#ifdef __opencl_c_atomic_scope_device | ||
| 3874 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int *object, int operand, | ||
| 3875 | + memory_order order); | ||
| 3876 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint *object, | ||
| 3877 | + uint operand, memory_order order); | ||
| 3878 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int *object, int operand, | ||
| 3879 | + memory_order order); | ||
| 3880 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint *object, | ||
| 3881 | + uint operand, memory_order order); | ||
| 3882 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int *object, int operand, | ||
| 3883 | + memory_order order); | ||
| 3884 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint *object, uint operand, | ||
| 3885 | + memory_order order); | ||
| 3886 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int *object, int operand, | ||
| 3887 | + memory_order order); | ||
| 3888 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint *object, | ||
| 3889 | + uint operand, memory_order order); | ||
| 3890 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int *object, int operand, | ||
| 3891 | + memory_order order); | ||
| 3892 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint *object, | ||
| 3893 | + uint operand, memory_order order); | ||
| 3894 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, | ||
| 3895 | + memory_order order); | ||
| 3896 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, | ||
| 3897 | + uint operand, memory_order order); | ||
| 3898 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, | ||
| 3899 | + memory_order order); | ||
| 3900 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, | ||
| 3901 | + uint operand, memory_order order); | ||
| 3902 | +#endif // __opencl_c_atomic_scope_device | ||
| 3903 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int *object, int operand, | ||
| 3904 | + memory_order order, memory_scope scope); | ||
| 3905 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint *object, | ||
| 3906 | + uint operand, memory_order order, | ||
| 3907 | + memory_scope scope); | ||
| 3908 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int *object, int operand, | ||
| 3909 | + memory_order order, memory_scope scope); | ||
| 3910 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint *object, | ||
| 3911 | + uint operand, memory_order order, | ||
| 3912 | + memory_scope scope); | ||
| 3913 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int *object, int operand, | ||
| 3914 | + memory_order order, memory_scope scope); | ||
| 3915 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint *object, uint operand, | ||
| 3916 | + memory_order order, memory_scope scope); | ||
| 3917 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int *object, int operand, | ||
| 3918 | + memory_order order, memory_scope scope); | ||
| 3919 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint *object, | ||
| 3920 | + uint operand, memory_order order, | ||
| 3921 | + memory_scope scope); | ||
| 3922 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int *object, int operand, | ||
| 3923 | + memory_order order, memory_scope scope); | ||
| 3924 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint *object, | ||
| 3925 | + uint operand, memory_order order, | ||
| 3926 | + memory_scope scope); | ||
| 3927 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, | ||
| 3928 | + memory_order order, memory_scope scope); | ||
| 3929 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, | ||
| 3930 | + uint operand, memory_order order, | ||
| 3931 | + memory_scope scope); | ||
| 3932 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, | ||
| 3933 | + memory_order order, memory_scope scope); | ||
| 3934 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, | ||
| 3935 | + uint operand, memory_order order, | ||
| 3936 | + memory_scope scope); | ||
| 3937 | + | ||
| 3938 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3939 | +#ifdef __opencl_c_atomic_scope_device | ||
| 3940 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long *object, | ||
| 3941 | + long operand, memory_order order); | ||
| 3942 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong *object, | ||
| 3943 | + ulong operand, memory_order order); | ||
| 3944 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long *object, | ||
| 3945 | + long operand, memory_order order); | ||
| 3946 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong *object, | ||
| 3947 | + ulong operand, memory_order order); | ||
| 3948 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long *object, long operand, | ||
| 3949 | + memory_order order); | ||
| 3950 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong *object, | ||
| 3951 | + ulong operand, memory_order order); | ||
| 3952 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long *object, | ||
| 3953 | + long operand, memory_order order); | ||
| 3954 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong *object, | ||
| 3955 | + ulong operand, memory_order order); | ||
| 3956 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long *object, | ||
| 3957 | + long operand, memory_order order); | ||
| 3958 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong *object, | ||
| 3959 | + ulong operand, memory_order order); | ||
| 3960 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long *object, | ||
| 3961 | + long operand, memory_order order); | ||
| 3962 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, | ||
| 3963 | + ulong operand, memory_order order); | ||
| 3964 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long *object, | ||
| 3965 | + long operand, memory_order order); | ||
| 3966 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, | ||
| 3967 | + ulong operand, memory_order order); | ||
| 3968 | +#endif // __opencl_c_atomic_scope_device | ||
| 3969 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long *object, | ||
| 3970 | + long operand, memory_order order, | ||
| 3971 | + memory_scope scope); | ||
| 3972 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong *object, | ||
| 3973 | + ulong operand, memory_order order, | ||
| 3974 | + memory_scope scope); | ||
| 3975 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long *object, | ||
| 3976 | + long operand, memory_order order, | ||
| 3977 | + memory_scope scope); | ||
| 3978 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong *object, | ||
| 3979 | + ulong operand, memory_order order, | ||
| 3980 | + memory_scope scope); | ||
| 3981 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long *object, long operand, | ||
| 3982 | + memory_order order, memory_scope scope); | ||
| 3983 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong *object, | ||
| 3984 | + ulong operand, memory_order order, | ||
| 3985 | + memory_scope scope); | ||
| 3986 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long *object, | ||
| 3987 | + long operand, memory_order order, | ||
| 3988 | + memory_scope scope); | ||
| 3989 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong *object, | ||
| 3990 | + ulong operand, memory_order order, | ||
| 3991 | + memory_scope scope); | ||
| 3992 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long *object, | ||
| 3993 | + long operand, memory_order order, | ||
| 3994 | + memory_scope scope); | ||
| 3995 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong *object, | ||
| 3996 | + ulong operand, memory_order order, | ||
| 3997 | + memory_scope scope); | ||
| 3998 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long *object, | ||
| 3999 | + long operand, memory_order order, | ||
| 4000 | + memory_scope scope); | ||
| 4001 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, | ||
| 4002 | + ulong operand, memory_order order, | ||
| 4003 | + memory_scope scope); | ||
| 4004 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long *object, | ||
| 4005 | + long operand, memory_order order, | ||
| 4006 | + memory_scope scope); | ||
| 4007 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, | ||
| 4008 | + ulong operand, memory_order order, | ||
| 4009 | + memory_scope scope); | ||
| 4010 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4011 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4012 | + | ||
| 4013 | +// OpenCL v2.0 s6.13.11.7.5: | ||
| 4014 | +// add/sub: atomic type argument can be uintptr_t/intptr_t, value type argument | ||
| 4015 | +// can be ptrdiff_t. or/xor/and/min/max: atomic type argument can be | ||
| 4016 | +// intptr_t/uintptr_t, value type argument can be intptr_t/uintptr_t. | ||
| 4017 | + | ||
| 4018 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4019 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4020 | +uintptr_t __ovld atomic_fetch_add_explicit(volatile atomic_uintptr_t *object, | ||
| 4021 | + ptrdiff_t operand, | ||
| 4022 | + memory_order order); | ||
| 4023 | +uintptr_t __ovld atomic_fetch_sub_explicit(volatile atomic_uintptr_t *object, | ||
| 4024 | + ptrdiff_t operand, | ||
| 4025 | + memory_order order); | ||
| 4026 | +uintptr_t __ovld atomic_fetch_or_explicit(volatile atomic_uintptr_t *object, | ||
| 4027 | + intptr_t operand, memory_order order); | ||
| 4028 | +uintptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_uintptr_t *object, | ||
| 4029 | + intptr_t operand, | ||
| 4030 | + memory_order order); | ||
| 4031 | +uintptr_t __ovld atomic_fetch_and_explicit(volatile atomic_uintptr_t *object, | ||
| 4032 | + intptr_t operand, | ||
| 4033 | + memory_order order); | ||
| 4034 | +uintptr_t __ovld atomic_fetch_min_explicit(volatile atomic_uintptr_t *object, | ||
| 4035 | + intptr_t opermax, | ||
| 4036 | + memory_order minder); | ||
| 4037 | +uintptr_t __ovld atomic_fetch_max_explicit(volatile atomic_uintptr_t *object, | ||
| 4038 | + intptr_t opermax, | ||
| 4039 | + memory_order minder); | ||
| 4040 | +intptr_t __ovld atomic_fetch_or_explicit(volatile atomic_intptr_t *object, | ||
| 4041 | + uintptr_t operand, memory_order order); | ||
| 4042 | +intptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_intptr_t *object, | ||
| 4043 | + uintptr_t operand, | ||
| 4044 | + memory_order order); | ||
| 4045 | +intptr_t __ovld atomic_fetch_and_explicit(volatile atomic_intptr_t *object, | ||
| 4046 | + uintptr_t operand, | ||
| 4047 | + memory_order order); | ||
| 4048 | +intptr_t __ovld atomic_fetch_min_explicit(volatile atomic_intptr_t *object, | ||
| 4049 | + uintptr_t opermax, | ||
| 4050 | + memory_order minder); | ||
| 4051 | +intptr_t __ovld atomic_fetch_max_explicit(volatile atomic_intptr_t *object, | ||
| 4052 | + uintptr_t opermax, | ||
| 4053 | + memory_order minder); | ||
| 4054 | +#endif // __opencl_c_atomic_scope_device | ||
| 4055 | +uintptr_t __ovld atomic_fetch_add_explicit(volatile atomic_uintptr_t *object, | ||
| 4056 | + ptrdiff_t operand, | ||
| 4057 | + memory_order order, | ||
| 4058 | + memory_scope scope); | ||
| 4059 | +uintptr_t __ovld atomic_fetch_sub_explicit(volatile atomic_uintptr_t *object, | ||
| 4060 | + ptrdiff_t operand, | ||
| 4061 | + memory_order order, | ||
| 4062 | + memory_scope scope); | ||
| 4063 | + | ||
| 4064 | +uintptr_t __ovld atomic_fetch_or_explicit(volatile atomic_uintptr_t *object, | ||
| 4065 | + intptr_t operand, memory_order order, | ||
| 4066 | + memory_scope scope); | ||
| 4067 | +uintptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_uintptr_t *object, | ||
| 4068 | + intptr_t operand, memory_order order, | ||
| 4069 | + memory_scope scope); | ||
| 4070 | +uintptr_t __ovld atomic_fetch_and_explicit(volatile atomic_uintptr_t *object, | ||
| 4071 | + intptr_t operand, memory_order order, | ||
| 4072 | + memory_scope scope); | ||
| 4073 | +uintptr_t __ovld atomic_fetch_min_explicit(volatile atomic_uintptr_t *object, | ||
| 4074 | + intptr_t opermax, | ||
| 4075 | + memory_order minder, | ||
| 4076 | + memory_scope scope); | ||
| 4077 | +uintptr_t __ovld atomic_fetch_max_explicit(volatile atomic_uintptr_t *object, | ||
| 4078 | + intptr_t opermax, | ||
| 4079 | + memory_order minder, | ||
| 4080 | + memory_scope scope); | ||
| 4081 | + | ||
| 4082 | +intptr_t __ovld atomic_fetch_or_explicit(volatile atomic_intptr_t *object, | ||
| 4083 | + uintptr_t operand, memory_order order, | ||
| 4084 | + memory_scope scope); | ||
| 4085 | +intptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_intptr_t *object, | ||
| 4086 | + uintptr_t operand, memory_order order, | ||
| 4087 | + memory_scope scope); | ||
| 4088 | +intptr_t __ovld atomic_fetch_and_explicit(volatile atomic_intptr_t *object, | ||
| 4089 | + uintptr_t operand, memory_order order, | ||
| 4090 | + memory_scope scope); | ||
| 4091 | +intptr_t __ovld atomic_fetch_min_explicit(volatile atomic_intptr_t *object, | ||
| 4092 | + uintptr_t opermax, | ||
| 4093 | + memory_order minder, | ||
| 4094 | + memory_scope scope); | ||
| 4095 | +intptr_t __ovld atomic_fetch_max_explicit(volatile atomic_intptr_t *object, | ||
| 4096 | + uintptr_t opermax, | ||
| 4097 | + memory_order minder, | ||
| 4098 | + memory_scope scope); | ||
| 4099 | #endif | ||
| 4100 | +#endif // __opencl_c_generic_address_space | ||
| 4101 | + | ||
| 4102 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4103 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4104 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int __global *object, | ||
| 4105 | + int operand, memory_order order); | ||
| 4106 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int __local *object, | ||
| 4107 | + int operand, memory_order order); | ||
| 4108 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint __global *object, | ||
| 4109 | + uint operand, memory_order order); | ||
| 4110 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint __local *object, | ||
| 4111 | + uint operand, memory_order order); | ||
| 4112 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int __global *object, | ||
| 4113 | + int operand, memory_order order); | ||
| 4114 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int __local *object, | ||
| 4115 | + int operand, memory_order order); | ||
| 4116 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint __global *object, | ||
| 4117 | + uint operand, memory_order order); | ||
| 4118 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint __local *object, | ||
| 4119 | + uint operand, memory_order order); | ||
| 4120 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int __global *object, | ||
| 4121 | + int operand, memory_order order); | ||
| 4122 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int __local *object, | ||
| 4123 | + int operand, memory_order order); | ||
| 4124 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint __global *object, | ||
| 4125 | + uint operand, memory_order order); | ||
| 4126 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint __local *object, | ||
| 4127 | + uint operand, memory_order order); | ||
| 4128 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int __global *object, | ||
| 4129 | + int operand, memory_order order); | ||
| 4130 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int __local *object, | ||
| 4131 | + int operand, memory_order order); | ||
| 4132 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint __global *object, | ||
| 4133 | + uint operand, memory_order order); | ||
| 4134 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint __local *object, | ||
| 4135 | + uint operand, memory_order order); | ||
| 4136 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int __global *object, | ||
| 4137 | + int operand, memory_order order); | ||
| 4138 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int __local *object, | ||
| 4139 | + int operand, memory_order order); | ||
| 4140 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint __global *object, | ||
| 4141 | + uint operand, memory_order order); | ||
| 4142 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint __local *object, | ||
| 4143 | + uint operand, memory_order order); | ||
| 4144 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int __global *object, | ||
| 4145 | + int operand, memory_order order); | ||
| 4146 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int __local *object, | ||
| 4147 | + int operand, memory_order order); | ||
| 4148 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint __global *object, | ||
| 4149 | + uint operand, memory_order order); | ||
| 4150 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint __local *object, | ||
| 4151 | + uint operand, memory_order order); | ||
| 4152 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int __global *object, | ||
| 4153 | + int operand, memory_order order); | ||
| 4154 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int __local *object, | ||
| 4155 | + int operand, memory_order order); | ||
| 4156 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint __global *object, | ||
| 4157 | + uint operand, memory_order order); | ||
| 4158 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint __local *object, | ||
| 4159 | + uint operand, memory_order order); | ||
| 4160 | +#endif // __opencl_c_atomic_scope_device | ||
| 4161 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int __global *object, | ||
| 4162 | + int operand, memory_order order, | ||
| 4163 | + memory_scope scope); | ||
| 4164 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int __local *object, | ||
| 4165 | + int operand, memory_order order, | ||
| 4166 | + memory_scope scope); | ||
| 4167 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint __global *object, | ||
| 4168 | + uint operand, memory_order order, | ||
| 4169 | + memory_scope scope); | ||
| 4170 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint __local *object, | ||
| 4171 | + uint operand, memory_order order, | ||
| 4172 | + memory_scope scope); | ||
| 4173 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int __global *object, | ||
| 4174 | + int operand, memory_order order, | ||
| 4175 | + memory_scope scope); | ||
| 4176 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int __local *object, | ||
| 4177 | + int operand, memory_order order, | ||
| 4178 | + memory_scope scope); | ||
| 4179 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint __global *object, | ||
| 4180 | + uint operand, memory_order order, | ||
| 4181 | + memory_scope scope); | ||
| 4182 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint __local *object, | ||
| 4183 | + uint operand, memory_order order, | ||
| 4184 | + memory_scope scope); | ||
| 4185 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int __global *object, | ||
| 4186 | + int operand, memory_order order, | ||
| 4187 | + memory_scope scope); | ||
| 4188 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int __local *object, | ||
| 4189 | + int operand, memory_order order, | ||
| 4190 | + memory_scope scope); | ||
| 4191 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint __global *object, | ||
| 4192 | + uint operand, memory_order order, | ||
| 4193 | + memory_scope scope); | ||
| 4194 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint __local *object, | ||
| 4195 | + uint operand, memory_order order, | ||
| 4196 | + memory_scope scope); | ||
| 4197 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int __global *object, | ||
| 4198 | + int operand, memory_order order, | ||
| 4199 | + memory_scope scope); | ||
| 4200 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int __local *object, | ||
| 4201 | + int operand, memory_order order, | ||
| 4202 | + memory_scope scope); | ||
| 4203 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint __global *object, | ||
| 4204 | + uint operand, memory_order order, | ||
| 4205 | + memory_scope scope); | ||
| 4206 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint __local *object, | ||
| 4207 | + uint operand, memory_order order, | ||
| 4208 | + memory_scope scope); | ||
| 4209 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int __global *object, | ||
| 4210 | + int operand, memory_order order, | ||
| 4211 | + memory_scope scope); | ||
| 4212 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int __local *object, | ||
| 4213 | + int operand, memory_order order, | ||
| 4214 | + memory_scope scope); | ||
| 4215 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint __global *object, | ||
| 4216 | + uint operand, memory_order order, | ||
| 4217 | + memory_scope scope); | ||
| 4218 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint __local *object, | ||
| 4219 | + uint operand, memory_order order, | ||
| 4220 | + memory_scope scope); | ||
| 4221 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int __global *object, | ||
| 4222 | + int operand, memory_order order, | ||
| 4223 | + memory_scope scope); | ||
| 4224 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int __local *object, | ||
| 4225 | + int operand, memory_order order, | ||
| 4226 | + memory_scope scope); | ||
| 4227 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint __global *object, | ||
| 4228 | + uint operand, memory_order order, | ||
| 4229 | + memory_scope scope); | ||
| 4230 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint __local *object, | ||
| 4231 | + uint operand, memory_order order, | ||
| 4232 | + memory_scope scope); | ||
| 4233 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int __global *object, | ||
| 4234 | + int operand, memory_order order, | ||
| 4235 | + memory_scope scope); | ||
| 4236 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int __local *object, | ||
| 4237 | + int operand, memory_order order, | ||
| 4238 | + memory_scope scope); | ||
| 4239 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint __global *object, | ||
| 4240 | + uint operand, memory_order order, | ||
| 4241 | + memory_scope scope); | ||
| 4242 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint __local *object, | ||
| 4243 | + uint operand, memory_order order, | ||
| 4244 | + memory_scope scope); | ||
| 4245 | + | ||
| 4246 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4247 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4248 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long __global *object, | ||
| 4249 | + long operand, memory_order order); | ||
| 4250 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long __local *object, | ||
| 4251 | + long operand, memory_order order); | ||
| 4252 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong __global *object, | ||
| 4253 | + ulong operand, memory_order order); | ||
| 4254 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong __local *object, | ||
| 4255 | + ulong operand, memory_order order); | ||
| 4256 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long __global *object, | ||
| 4257 | + long operand, memory_order order); | ||
| 4258 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long __local *object, | ||
| 4259 | + long operand, memory_order order); | ||
| 4260 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong __global *object, | ||
| 4261 | + ulong operand, memory_order order); | ||
| 4262 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong __local *object, | ||
| 4263 | + ulong operand, memory_order order); | ||
| 4264 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long __global *object, | ||
| 4265 | + long operand, memory_order order); | ||
| 4266 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long __local *object, | ||
| 4267 | + long operand, memory_order order); | ||
| 4268 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong __global *object, | ||
| 4269 | + ulong operand, memory_order order); | ||
| 4270 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong __local *object, | ||
| 4271 | + ulong operand, memory_order order); | ||
| 4272 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long __global *object, | ||
| 4273 | + long operand, memory_order order); | ||
| 4274 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long __local *object, | ||
| 4275 | + long operand, memory_order order); | ||
| 4276 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong __global *object, | ||
| 4277 | + ulong operand, memory_order order); | ||
| 4278 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong __local *object, | ||
| 4279 | + ulong operand, memory_order order); | ||
| 4280 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long __global *object, | ||
| 4281 | + long operand, memory_order order); | ||
| 4282 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long __local *object, | ||
| 4283 | + long operand, memory_order order); | ||
| 4284 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong __global *object, | ||
| 4285 | + ulong operand, memory_order order); | ||
| 4286 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong __local *object, | ||
| 4287 | + ulong operand, memory_order order); | ||
| 4288 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long __global *object, | ||
| 4289 | + long operand, memory_order order); | ||
| 4290 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long __local *object, | ||
| 4291 | + long operand, memory_order order); | ||
| 4292 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong __global *object, | ||
| 4293 | + ulong operand, memory_order order); | ||
| 4294 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong __local *object, | ||
| 4295 | + ulong operand, memory_order order); | ||
| 4296 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long __global *object, | ||
| 4297 | + long operand, memory_order order); | ||
| 4298 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long __local *object, | ||
| 4299 | + long operand, memory_order order); | ||
| 4300 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong __global *object, | ||
| 4301 | + ulong operand, memory_order order); | ||
| 4302 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong __local *object, | ||
| 4303 | + ulong operand, memory_order order); | ||
| 4304 | +#endif // __opencl_c_atomic_scope_device | ||
| 4305 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long __global *object, | ||
| 4306 | + long operand, memory_order order, | ||
| 4307 | + memory_scope scope); | ||
| 4308 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long __local *object, | ||
| 4309 | + long operand, memory_order order, | ||
| 4310 | + memory_scope scope); | ||
| 4311 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong __global *object, | ||
| 4312 | + ulong operand, memory_order order, | ||
| 4313 | + memory_scope scope); | ||
| 4314 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong __local *object, | ||
| 4315 | + ulong operand, memory_order order, | ||
| 4316 | + memory_scope scope); | ||
| 4317 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long __global *object, | ||
| 4318 | + long operand, memory_order order, | ||
| 4319 | + memory_scope scope); | ||
| 4320 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long __local *object, | ||
| 4321 | + long operand, memory_order order, | ||
| 4322 | + memory_scope scope); | ||
| 4323 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong __global *object, | ||
| 4324 | + ulong operand, memory_order order, | ||
| 4325 | + memory_scope scope); | ||
| 4326 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong __local *object, | ||
| 4327 | + ulong operand, memory_order order, | ||
| 4328 | + memory_scope scope); | ||
| 4329 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long __global *object, | ||
| 4330 | + long operand, memory_order order, | ||
| 4331 | + memory_scope scope); | ||
| 4332 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long __local *object, | ||
| 4333 | + long operand, memory_order order, | ||
| 4334 | + memory_scope scope); | ||
| 4335 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong __global *object, | ||
| 4336 | + ulong operand, memory_order order, | ||
| 4337 | + memory_scope scope); | ||
| 4338 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong __local *object, | ||
| 4339 | + ulong operand, memory_order order, | ||
| 4340 | + memory_scope scope); | ||
| 4341 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long __global *object, | ||
| 4342 | + long operand, memory_order order, | ||
| 4343 | + memory_scope scope); | ||
| 4344 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long __local *object, | ||
| 4345 | + long operand, memory_order order, | ||
| 4346 | + memory_scope scope); | ||
| 4347 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong __global *object, | ||
| 4348 | + ulong operand, memory_order order, | ||
| 4349 | + memory_scope scope); | ||
| 4350 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong __local *object, | ||
| 4351 | + ulong operand, memory_order order, | ||
| 4352 | + memory_scope scope); | ||
| 4353 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long __global *object, | ||
| 4354 | + long operand, memory_order order, | ||
| 4355 | + memory_scope scope); | ||
| 4356 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long __local *object, | ||
| 4357 | + long operand, memory_order order, | ||
| 4358 | + memory_scope scope); | ||
| 4359 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong __global *object, | ||
| 4360 | + ulong operand, memory_order order, | ||
| 4361 | + memory_scope scope); | ||
| 4362 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong __local *object, | ||
| 4363 | + ulong operand, memory_order order, | ||
| 4364 | + memory_scope scope); | ||
| 4365 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long __global *object, | ||
| 4366 | + long operand, memory_order order, | ||
| 4367 | + memory_scope scope); | ||
| 4368 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long __local *object, | ||
| 4369 | + long operand, memory_order order, | ||
| 4370 | + memory_scope scope); | ||
| 4371 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong __global *object, | ||
| 4372 | + ulong operand, memory_order order, | ||
| 4373 | + memory_scope scope); | ||
| 4374 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong __local *object, | ||
| 4375 | + ulong operand, memory_order order, | ||
| 4376 | + memory_scope scope); | ||
| 4377 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long __global *object, | ||
| 4378 | + long operand, memory_order order, | ||
| 4379 | + memory_scope scope); | ||
| 4380 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long __local *object, | ||
| 4381 | + long operand, memory_order order, | ||
| 4382 | + memory_scope scope); | ||
| 4383 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong __global *object, | ||
| 4384 | + ulong operand, memory_order order, | ||
| 4385 | + memory_scope scope); | ||
| 4386 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong __local *object, | ||
| 4387 | + ulong operand, memory_order order, | ||
| 4388 | + memory_scope scope); | ||
| 4389 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4390 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4391 | + | ||
| 4392 | +// OpenCL v2.0 s6.13.11.7.5: | ||
| 4393 | +// add/sub: atomic type argument can be uintptr_t/intptr_t, value type argument | ||
| 4394 | +// can be ptrdiff_t. or/xor/and/min/max: atomic type argument can be | ||
| 4395 | +// intptr_t/uintptr_t, value type argument can be intptr_t/uintptr_t. | ||
| 4396 | + | ||
| 4397 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4398 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4399 | +uintptr_t __ovld | ||
| 4400 | +atomic_fetch_add_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4401 | + ptrdiff_t operand, memory_order order); | ||
| 4402 | +uintptr_t __ovld | ||
| 4403 | +atomic_fetch_add_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4404 | + ptrdiff_t operand, memory_order order); | ||
| 4405 | +uintptr_t __ovld | ||
| 4406 | +atomic_fetch_sub_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4407 | + ptrdiff_t operand, memory_order order); | ||
| 4408 | +uintptr_t __ovld | ||
| 4409 | +atomic_fetch_sub_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4410 | + ptrdiff_t operand, memory_order order); | ||
| 4411 | +uintptr_t __ovld | ||
| 4412 | +atomic_fetch_or_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4413 | + intptr_t operand, memory_order order); | ||
| 4414 | +uintptr_t __ovld | ||
| 4415 | +atomic_fetch_or_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4416 | + intptr_t operand, memory_order order); | ||
| 4417 | +uintptr_t __ovld | ||
| 4418 | +atomic_fetch_xor_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4419 | + intptr_t operand, memory_order order); | ||
| 4420 | +uintptr_t __ovld | ||
| 4421 | +atomic_fetch_xor_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4422 | + intptr_t operand, memory_order order); | ||
| 4423 | +uintptr_t __ovld | ||
| 4424 | +atomic_fetch_and_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4425 | + intptr_t operand, memory_order order); | ||
| 4426 | +uintptr_t __ovld | ||
| 4427 | +atomic_fetch_and_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4428 | + intptr_t operand, memory_order order); | ||
| 4429 | +uintptr_t __ovld | ||
| 4430 | +atomic_fetch_min_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4431 | + intptr_t opermax, memory_order minder); | ||
| 4432 | +uintptr_t __ovld | ||
| 4433 | +atomic_fetch_min_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4434 | + intptr_t opermax, memory_order minder); | ||
| 4435 | +uintptr_t __ovld | ||
| 4436 | +atomic_fetch_max_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4437 | + intptr_t opermax, memory_order minder); | ||
| 4438 | +uintptr_t __ovld | ||
| 4439 | +atomic_fetch_max_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4440 | + intptr_t opermax, memory_order minder); | ||
| 4441 | +intptr_t __ovld | ||
| 4442 | +atomic_fetch_or_explicit(volatile atomic_intptr_t __global *object, | ||
| 4443 | + uintptr_t operand, memory_order order); | ||
| 4444 | +intptr_t __ovld | ||
| 4445 | +atomic_fetch_or_explicit(volatile atomic_intptr_t __local *object, | ||
| 4446 | + uintptr_t operand, memory_order order); | ||
| 4447 | +intptr_t __ovld | ||
| 4448 | +atomic_fetch_xor_explicit(volatile atomic_intptr_t __global *object, | ||
| 4449 | + uintptr_t operand, memory_order order); | ||
| 4450 | +intptr_t __ovld | ||
| 4451 | +atomic_fetch_xor_explicit(volatile atomic_intptr_t __local *object, | ||
| 4452 | + uintptr_t operand, memory_order order); | ||
| 4453 | +intptr_t __ovld | ||
| 4454 | +atomic_fetch_and_explicit(volatile atomic_intptr_t __global *object, | ||
| 4455 | + uintptr_t operand, memory_order order); | ||
| 4456 | +intptr_t __ovld | ||
| 4457 | +atomic_fetch_and_explicit(volatile atomic_intptr_t __local *object, | ||
| 4458 | + uintptr_t operand, memory_order order); | ||
| 4459 | +intptr_t __ovld | ||
| 4460 | +atomic_fetch_min_explicit(volatile atomic_intptr_t __global *object, | ||
| 4461 | + uintptr_t opermax, memory_order minder); | ||
| 4462 | +intptr_t __ovld | ||
| 4463 | +atomic_fetch_min_explicit(volatile atomic_intptr_t __local *object, | ||
| 4464 | + uintptr_t opermax, memory_order minder); | ||
| 4465 | +intptr_t __ovld | ||
| 4466 | +atomic_fetch_max_explicit(volatile atomic_intptr_t __global *object, | ||
| 4467 | + uintptr_t opermax, memory_order minder); | ||
| 4468 | +intptr_t __ovld | ||
| 4469 | +atomic_fetch_max_explicit(volatile atomic_intptr_t __local *object, | ||
| 4470 | + uintptr_t opermax, memory_order minder); | ||
| 4471 | +#endif // __opencl_c_atomic_scope_device | ||
| 4472 | +uintptr_t __ovld atomic_fetch_add_explicit( | ||
| 4473 | + volatile atomic_uintptr_t __global *object, ptrdiff_t operand, | ||
| 4474 | + memory_order order, memory_scope scope); | ||
| 4475 | +uintptr_t __ovld atomic_fetch_add_explicit( | ||
| 4476 | + volatile atomic_uintptr_t __local *object, ptrdiff_t operand, | ||
| 4477 | + memory_order order, memory_scope scope); | ||
| 4478 | +uintptr_t __ovld atomic_fetch_sub_explicit( | ||
| 4479 | + volatile atomic_uintptr_t __global *object, ptrdiff_t operand, | ||
| 4480 | + memory_order order, memory_scope scope); | ||
| 4481 | +uintptr_t __ovld atomic_fetch_sub_explicit( | ||
| 4482 | + volatile atomic_uintptr_t __local *object, ptrdiff_t operand, | ||
| 4483 | + memory_order order, memory_scope scope); | ||
| 4484 | + | ||
| 4485 | +uintptr_t __ovld atomic_fetch_or_explicit( | ||
| 4486 | + volatile atomic_uintptr_t __global *object, intptr_t operand, | ||
| 4487 | + memory_order order, memory_scope scope); | ||
| 4488 | +uintptr_t __ovld atomic_fetch_or_explicit( | ||
| 4489 | + volatile atomic_uintptr_t __local *object, intptr_t operand, | ||
| 4490 | + memory_order order, memory_scope scope); | ||
| 4491 | +uintptr_t __ovld atomic_fetch_xor_explicit( | ||
| 4492 | + volatile atomic_uintptr_t __global *object, intptr_t operand, | ||
| 4493 | + memory_order order, memory_scope scope); | ||
| 4494 | +uintptr_t __ovld atomic_fetch_xor_explicit( | ||
| 4495 | + volatile atomic_uintptr_t __local *object, intptr_t operand, | ||
| 4496 | + memory_order order, memory_scope scope); | ||
| 4497 | +uintptr_t __ovld atomic_fetch_and_explicit( | ||
| 4498 | + volatile atomic_uintptr_t __global *object, intptr_t operand, | ||
| 4499 | + memory_order order, memory_scope scope); | ||
| 4500 | +uintptr_t __ovld atomic_fetch_and_explicit( | ||
| 4501 | + volatile atomic_uintptr_t __local *object, intptr_t operand, | ||
| 4502 | + memory_order order, memory_scope scope); | ||
| 4503 | +uintptr_t __ovld atomic_fetch_min_explicit( | ||
| 4504 | + volatile atomic_uintptr_t __global *object, intptr_t opermax, | ||
| 4505 | + memory_order minder, memory_scope scope); | ||
| 4506 | +uintptr_t __ovld atomic_fetch_min_explicit( | ||
| 4507 | + volatile atomic_uintptr_t __local *object, intptr_t opermax, | ||
| 4508 | + memory_order minder, memory_scope scope); | ||
| 4509 | +uintptr_t __ovld atomic_fetch_max_explicit( | ||
| 4510 | + volatile atomic_uintptr_t __global *object, intptr_t opermax, | ||
| 4511 | + memory_order minder, memory_scope scope); | ||
| 4512 | +uintptr_t __ovld atomic_fetch_max_explicit( | ||
| 4513 | + volatile atomic_uintptr_t __local *object, intptr_t opermax, | ||
| 4514 | + memory_order minder, memory_scope scope); | ||
| 4515 | + | ||
| 4516 | +intptr_t __ovld atomic_fetch_or_explicit( | ||
| 4517 | + volatile atomic_intptr_t __global *object, uintptr_t operand, | ||
| 4518 | + memory_order order, memory_scope scope); | ||
| 4519 | +intptr_t __ovld atomic_fetch_or_explicit( | ||
| 4520 | + volatile atomic_intptr_t __local *object, uintptr_t operand, | ||
| 4521 | + memory_order order, memory_scope scope); | ||
| 4522 | +intptr_t __ovld atomic_fetch_xor_explicit( | ||
| 4523 | + volatile atomic_intptr_t __global *object, uintptr_t operand, | ||
| 4524 | + memory_order order, memory_scope scope); | ||
| 4525 | +intptr_t __ovld atomic_fetch_xor_explicit( | ||
| 4526 | + volatile atomic_intptr_t __local *object, uintptr_t operand, | ||
| 4527 | + memory_order order, memory_scope scope); | ||
| 4528 | +intptr_t __ovld atomic_fetch_and_explicit( | ||
| 4529 | + volatile atomic_intptr_t __global *object, uintptr_t operand, | ||
| 4530 | + memory_order order, memory_scope scope); | ||
| 4531 | +intptr_t __ovld atomic_fetch_and_explicit( | ||
| 4532 | + volatile atomic_intptr_t __local *object, uintptr_t operand, | ||
| 4533 | + memory_order order, memory_scope scope); | ||
| 4534 | +intptr_t __ovld atomic_fetch_min_explicit( | ||
| 4535 | + volatile atomic_intptr_t __global *object, uintptr_t opermax, | ||
| 4536 | + memory_order minder, memory_scope scope); | ||
| 4537 | +intptr_t __ovld atomic_fetch_min_explicit( | ||
| 4538 | + volatile atomic_intptr_t __local *object, uintptr_t opermax, | ||
| 4539 | + memory_order minder, memory_scope scope); | ||
| 4540 | +intptr_t __ovld atomic_fetch_max_explicit( | ||
| 4541 | + volatile atomic_intptr_t __global *object, uintptr_t opermax, | ||
| 4542 | + memory_order minder, memory_scope scope); | ||
| 4543 | +intptr_t __ovld atomic_fetch_max_explicit( | ||
| 4544 | + volatile atomic_intptr_t __local *object, uintptr_t opermax, | ||
| 4545 | + memory_order minder, memory_scope scope); | ||
| 4546 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4547 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4548 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4549 | |||
| 4550 | // atomic_store() | ||
| 4551 | |||
| 4552 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4553 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4554 | + | ||
| 4555 | +#ifdef __opencl_c_generic_address_space | ||
| 4556 | void __ovld atomic_store(volatile atomic_int *object, int desired); | ||
| 4557 | -void __ovld atomic_store_explicit(volatile atomic_int *object, int desired, memory_order order); | ||
| 4558 | -void __ovld atomic_store_explicit(volatile atomic_int *object, int desired, memory_order order, memory_scope scope); | ||
| 4559 | void __ovld atomic_store(volatile atomic_uint *object, uint desired); | ||
| 4560 | -void __ovld atomic_store_explicit(volatile atomic_uint *object, uint desired, memory_order order); | ||
| 4561 | -void __ovld atomic_store_explicit(volatile atomic_uint *object, uint desired, memory_order order, memory_scope scope); | ||
| 4562 | void __ovld atomic_store(volatile atomic_float *object, float desired); | ||
| 4563 | -void __ovld atomic_store_explicit(volatile atomic_float *object, float desired, memory_order order); | ||
| 4564 | -void __ovld atomic_store_explicit(volatile atomic_float *object, float desired, memory_order order, memory_scope scope); | ||
| 4565 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4566 | -#ifdef cl_khr_fp64 | ||
| 4567 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4568 | void __ovld atomic_store(volatile atomic_double *object, double desired); | ||
| 4569 | -void __ovld atomic_store_explicit(volatile atomic_double *object, double desired, memory_order order); | ||
| 4570 | -void __ovld atomic_store_explicit(volatile atomic_double *object, double desired, memory_order order, memory_scope scope); | ||
| 4571 | -#endif //cl_khr_fp64 | ||
| 4572 | +#endif | ||
| 4573 | void __ovld atomic_store(volatile atomic_long *object, long desired); | ||
| 4574 | -void __ovld atomic_store_explicit(volatile atomic_long *object, long desired, memory_order order); | ||
| 4575 | -void __ovld atomic_store_explicit(volatile atomic_long *object, long desired, memory_order order, memory_scope scope); | ||
| 4576 | void __ovld atomic_store(volatile atomic_ulong *object, ulong desired); | ||
| 4577 | -void __ovld atomic_store_explicit(volatile atomic_ulong *object, ulong desired, memory_order order); | ||
| 4578 | -void __ovld atomic_store_explicit(volatile atomic_ulong *object, ulong desired, memory_order order, memory_scope scope); | ||
| 4579 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4580 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4581 | +#endif // __opencl_c_generic_address_space | ||
| 4582 | + | ||
| 4583 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4584 | +void __ovld atomic_store(volatile atomic_int __global *object, int desired); | ||
| 4585 | +void __ovld atomic_store(volatile atomic_int __local *object, int desired); | ||
| 4586 | +void __ovld atomic_store(volatile atomic_uint __global *object, uint desired); | ||
| 4587 | +void __ovld atomic_store(volatile atomic_uint __local *object, uint desired); | ||
| 4588 | +void __ovld atomic_store(volatile atomic_float __global *object, float desired); | ||
| 4589 | +void __ovld atomic_store(volatile atomic_float __local *object, float desired); | ||
| 4590 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4591 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4592 | +void __ovld atomic_store(volatile atomic_double __global *object, | ||
| 4593 | + double desired); | ||
| 4594 | +void __ovld atomic_store(volatile atomic_double __local *object, | ||
| 4595 | + double desired); | ||
| 4596 | #endif | ||
| 4597 | +void __ovld atomic_store(volatile atomic_long __global *object, long desired); | ||
| 4598 | +void __ovld atomic_store(volatile atomic_long __local *object, long desired); | ||
| 4599 | +void __ovld atomic_store(volatile atomic_ulong __global *object, ulong desired); | ||
| 4600 | +void __ovld atomic_store(volatile atomic_ulong __local *object, ulong desired); | ||
| 4601 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4602 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4603 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4604 | + | ||
| 4605 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4606 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4607 | + | ||
| 4608 | +#ifdef __opencl_c_generic_address_space | ||
| 4609 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4610 | +void __ovld atomic_store_explicit(volatile atomic_int *object, int desired, | ||
| 4611 | + memory_order order); | ||
| 4612 | +void __ovld atomic_store_explicit(volatile atomic_uint *object, uint desired, | ||
| 4613 | + memory_order order); | ||
| 4614 | +void __ovld atomic_store_explicit(volatile atomic_float *object, float desired, | ||
| 4615 | + memory_order order); | ||
| 4616 | +#endif // __opencl_c_atomic_scope_device | ||
| 4617 | +void __ovld atomic_store_explicit(volatile atomic_int *object, int desired, | ||
| 4618 | + memory_order order, memory_scope scope); | ||
| 4619 | +void __ovld atomic_store_explicit(volatile atomic_uint *object, uint desired, | ||
| 4620 | + memory_order order, memory_scope scope); | ||
| 4621 | +void __ovld atomic_store_explicit(volatile atomic_float *object, float desired, | ||
| 4622 | + memory_order order, memory_scope scope); | ||
| 4623 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4624 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4625 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4626 | +void __ovld atomic_store_explicit(volatile atomic_double *object, | ||
| 4627 | + double desired, memory_order order); | ||
| 4628 | +#endif //__opencl_c_atomic_scope_device | ||
| 4629 | +void __ovld atomic_store_explicit(volatile atomic_double *object, | ||
| 4630 | + double desired, memory_order order, | ||
| 4631 | + memory_scope scope); | ||
| 4632 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4633 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4634 | +void __ovld atomic_store_explicit(volatile atomic_long *object, long desired, | ||
| 4635 | + memory_order order); | ||
| 4636 | +void __ovld atomic_store_explicit(volatile atomic_ulong *object, ulong desired, | ||
| 4637 | + memory_order order); | ||
| 4638 | +#endif //__opencl_c_atomic_scope_device | ||
| 4639 | +void __ovld atomic_store_explicit(volatile atomic_long *object, long desired, | ||
| 4640 | + memory_order order, memory_scope scope); | ||
| 4641 | +void __ovld atomic_store_explicit(volatile atomic_ulong *object, ulong desired, | ||
| 4642 | + memory_order order, memory_scope scope); | ||
| 4643 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4644 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4645 | +#endif // __opencl_c_generic_address_space | ||
| 4646 | + | ||
| 4647 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4648 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4649 | +void __ovld atomic_store_explicit(volatile atomic_int __global *object, | ||
| 4650 | + int desired, memory_order order); | ||
| 4651 | +void __ovld atomic_store_explicit(volatile atomic_int __local *object, | ||
| 4652 | + int desired, memory_order order); | ||
| 4653 | +void __ovld atomic_store_explicit(volatile atomic_uint __global *object, | ||
| 4654 | + uint desired, memory_order order); | ||
| 4655 | +void __ovld atomic_store_explicit(volatile atomic_uint __local *object, | ||
| 4656 | + uint desired, memory_order order); | ||
| 4657 | +void __ovld atomic_store_explicit(volatile atomic_float __global *object, | ||
| 4658 | + float desired, memory_order order); | ||
| 4659 | +void __ovld atomic_store_explicit(volatile atomic_float __local *object, | ||
| 4660 | + float desired, memory_order order); | ||
| 4661 | +#endif // __opencl_c_atomic_scope_device | ||
| 4662 | +void __ovld atomic_store_explicit(volatile atomic_int __global *object, | ||
| 4663 | + int desired, memory_order order, | ||
| 4664 | + memory_scope scope); | ||
| 4665 | +void __ovld atomic_store_explicit(volatile atomic_int __local *object, | ||
| 4666 | + int desired, memory_order order, | ||
| 4667 | + memory_scope scope); | ||
| 4668 | +void __ovld atomic_store_explicit(volatile atomic_uint __global *object, | ||
| 4669 | + uint desired, memory_order order, | ||
| 4670 | + memory_scope scope); | ||
| 4671 | +void __ovld atomic_store_explicit(volatile atomic_uint __local *object, | ||
| 4672 | + uint desired, memory_order order, | ||
| 4673 | + memory_scope scope); | ||
| 4674 | +void __ovld atomic_store_explicit(volatile atomic_float __global *object, | ||
| 4675 | + float desired, memory_order order, | ||
| 4676 | + memory_scope scope); | ||
| 4677 | +void __ovld atomic_store_explicit(volatile atomic_float __local *object, | ||
| 4678 | + float desired, memory_order order, | ||
| 4679 | + memory_scope scope); | ||
| 4680 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4681 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4682 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4683 | +void __ovld atomic_store_explicit(volatile atomic_double __global *object, | ||
| 4684 | + double desired, memory_order order); | ||
| 4685 | +void __ovld atomic_store_explicit(volatile atomic_double __local *object, | ||
| 4686 | + double desired, memory_order order); | ||
| 4687 | +#endif //__opencl_c_atomic_scope_device | ||
| 4688 | +void __ovld atomic_store_explicit(volatile atomic_double __global *object, | ||
| 4689 | + double desired, memory_order order, | ||
| 4690 | + memory_scope scope); | ||
| 4691 | +void __ovld atomic_store_explicit(volatile atomic_double __local *object, | ||
| 4692 | + double desired, memory_order order, | ||
| 4693 | + memory_scope scope); | ||
| 4694 | +#endif // cl_khr_fp64 | ||
| 4695 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4696 | +void __ovld atomic_store_explicit(volatile atomic_long __global *object, | ||
| 4697 | + long desired, memory_order order); | ||
| 4698 | +void __ovld atomic_store_explicit(volatile atomic_long __local *object, | ||
| 4699 | + long desired, memory_order order); | ||
| 4700 | +void __ovld atomic_store_explicit(volatile atomic_ulong __global *object, | ||
| 4701 | + ulong desired, memory_order order); | ||
| 4702 | +void __ovld atomic_store_explicit(volatile atomic_ulong __local *object, | ||
| 4703 | + ulong desired, memory_order order); | ||
| 4704 | +#endif // __opencl_c_atomic_scope_device | ||
| 4705 | +void __ovld atomic_store_explicit(volatile atomic_long __global *object, | ||
| 4706 | + long desired, memory_order order, | ||
| 4707 | + memory_scope scope); | ||
| 4708 | +void __ovld atomic_store_explicit(volatile atomic_long __local *object, | ||
| 4709 | + long desired, memory_order order, | ||
| 4710 | + memory_scope scope); | ||
| 4711 | +void __ovld atomic_store_explicit(volatile atomic_ulong __global *object, | ||
| 4712 | + ulong desired, memory_order order, | ||
| 4713 | + memory_scope scope); | ||
| 4714 | +void __ovld atomic_store_explicit(volatile atomic_ulong __local *object, | ||
| 4715 | + ulong desired, memory_order order, | ||
| 4716 | + memory_scope scope); | ||
| 4717 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4718 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4719 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4720 | |||
| 4721 | // atomic_load() | ||
| 4722 | - | ||
| 4723 | +#ifdef __opencl_c_generic_address_space | ||
| 4724 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4725 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4726 | int __ovld atomic_load(volatile atomic_int *object); | ||
| 4727 | -int __ovld atomic_load_explicit(volatile atomic_int *object, memory_order order); | ||
| 4728 | -int __ovld atomic_load_explicit(volatile atomic_int *object, memory_order order, memory_scope scope); | ||
| 4729 | uint __ovld atomic_load(volatile atomic_uint *object); | ||
| 4730 | -uint __ovld atomic_load_explicit(volatile atomic_uint *object, memory_order order); | ||
| 4731 | -uint __ovld atomic_load_explicit(volatile atomic_uint *object, memory_order order, memory_scope scope); | ||
| 4732 | float __ovld atomic_load(volatile atomic_float *object); | ||
| 4733 | -float __ovld atomic_load_explicit(volatile atomic_float *object, memory_order order); | ||
| 4734 | -float __ovld atomic_load_explicit(volatile atomic_float *object, memory_order order, memory_scope scope); | ||
| 4735 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4736 | -#ifdef cl_khr_fp64 | ||
| 4737 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4738 | double __ovld atomic_load(volatile atomic_double *object); | ||
| 4739 | -double __ovld atomic_load_explicit(volatile atomic_double *object, memory_order order); | ||
| 4740 | -double __ovld atomic_load_explicit(volatile atomic_double *object, memory_order order, memory_scope scope); | ||
| 4741 | -#endif //cl_khr_fp64 | ||
| 4742 | +#endif // cl_khr_fp64 | ||
| 4743 | long __ovld atomic_load(volatile atomic_long *object); | ||
| 4744 | -long __ovld atomic_load_explicit(volatile atomic_long *object, memory_order order); | ||
| 4745 | -long __ovld atomic_load_explicit(volatile atomic_long *object, memory_order order, memory_scope scope); | ||
| 4746 | ulong __ovld atomic_load(volatile atomic_ulong *object); | ||
| 4747 | -ulong __ovld atomic_load_explicit(volatile atomic_ulong *object, memory_order order); | ||
| 4748 | -ulong __ovld atomic_load_explicit(volatile atomic_ulong *object, memory_order order, memory_scope scope); | ||
| 4749 | -#endif | ||
| 4750 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4751 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4752 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4753 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4754 | +#endif //__opencl_c_generic_address_space | ||
| 4755 | + | ||
| 4756 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4757 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4758 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4759 | +int __ovld atomic_load(volatile atomic_int __global *object); | ||
| 4760 | +int __ovld atomic_load(volatile atomic_int __local *object); | ||
| 4761 | +uint __ovld atomic_load(volatile atomic_uint __global *object); | ||
| 4762 | +uint __ovld atomic_load(volatile atomic_uint __local *object); | ||
| 4763 | +float __ovld atomic_load(volatile atomic_float __global *object); | ||
| 4764 | +float __ovld atomic_load(volatile atomic_float __local *object); | ||
| 4765 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4766 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4767 | +double __ovld atomic_load(volatile atomic_double __global *object); | ||
| 4768 | +double __ovld atomic_load(volatile atomic_double __local *object); | ||
| 4769 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4770 | +long __ovld atomic_load(volatile atomic_long __global *object); | ||
| 4771 | +long __ovld atomic_load(volatile atomic_long __local *object); | ||
| 4772 | +ulong __ovld atomic_load(volatile atomic_ulong __global *object); | ||
| 4773 | +ulong __ovld atomic_load(volatile atomic_ulong __local *object); | ||
| 4774 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4775 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4776 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4777 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4778 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4779 | + | ||
| 4780 | +#ifdef __opencl_c_generic_address_space | ||
| 4781 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4782 | +int __ovld atomic_load_explicit(volatile atomic_int *object, | ||
| 4783 | + memory_order order); | ||
| 4784 | +uint __ovld atomic_load_explicit(volatile atomic_uint *object, | ||
| 4785 | + memory_order order); | ||
| 4786 | +float __ovld atomic_load_explicit(volatile atomic_float *object, | ||
| 4787 | + memory_order order); | ||
| 4788 | +#endif // __opencl_c_atomic_scope_device | ||
| 4789 | +int __ovld atomic_load_explicit(volatile atomic_int *object, memory_order order, | ||
| 4790 | + memory_scope scope); | ||
| 4791 | +uint __ovld atomic_load_explicit(volatile atomic_uint *object, | ||
| 4792 | + memory_order order, memory_scope scope); | ||
| 4793 | +float __ovld atomic_load_explicit(volatile atomic_float *object, | ||
| 4794 | + memory_order order, memory_scope scope); | ||
| 4795 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4796 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4797 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4798 | +double __ovld atomic_load_explicit(volatile atomic_double *object, | ||
| 4799 | + memory_order order); | ||
| 4800 | +#endif // __opencl_c_atomic_scope_device | ||
| 4801 | +double __ovld atomic_load_explicit(volatile atomic_double *object, | ||
| 4802 | + memory_order order, memory_scope scope); | ||
| 4803 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4804 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4805 | +long __ovld atomic_load_explicit(volatile atomic_long *object, | ||
| 4806 | + memory_order order); | ||
| 4807 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong *object, | ||
| 4808 | + memory_order order); | ||
| 4809 | +#endif //__opencl_c_atomic_scope_device | ||
| 4810 | +long __ovld atomic_load_explicit(volatile atomic_long *object, | ||
| 4811 | + memory_order order, memory_scope scope); | ||
| 4812 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong *object, | ||
| 4813 | + memory_order order, memory_scope scope); | ||
| 4814 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4815 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4816 | +#endif // __opencl_c_generic_address_space | ||
| 4817 | + | ||
| 4818 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4819 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4820 | +int __ovld atomic_load_explicit(volatile atomic_int __global *object, | ||
| 4821 | + memory_order order); | ||
| 4822 | +int __ovld atomic_load_explicit(volatile atomic_int __local *object, | ||
| 4823 | + memory_order order); | ||
| 4824 | +uint __ovld atomic_load_explicit(volatile atomic_uint __global *object, | ||
| 4825 | + memory_order order); | ||
| 4826 | +uint __ovld atomic_load_explicit(volatile atomic_uint __local *object, | ||
| 4827 | + memory_order order); | ||
| 4828 | +float __ovld atomic_load_explicit(volatile atomic_float __global *object, | ||
| 4829 | + memory_order order); | ||
| 4830 | +float __ovld atomic_load_explicit(volatile atomic_float __local *object, | ||
| 4831 | + memory_order order); | ||
| 4832 | +#endif // __opencl_c_atomic_scope_device | ||
| 4833 | +int __ovld atomic_load_explicit(volatile atomic_int __global *object, | ||
| 4834 | + memory_order order, memory_scope scope); | ||
| 4835 | +int __ovld atomic_load_explicit(volatile atomic_int __local *object, | ||
| 4836 | + memory_order order, memory_scope scope); | ||
| 4837 | +uint __ovld atomic_load_explicit(volatile atomic_uint __global *object, | ||
| 4838 | + memory_order order, memory_scope scope); | ||
| 4839 | +uint __ovld atomic_load_explicit(volatile atomic_uint __local *object, | ||
| 4840 | + memory_order order, memory_scope scope); | ||
| 4841 | +float __ovld atomic_load_explicit(volatile atomic_float __global *object, | ||
| 4842 | + memory_order order, memory_scope scope); | ||
| 4843 | +float __ovld atomic_load_explicit(volatile atomic_float __local *object, | ||
| 4844 | + memory_order order, memory_scope scope); | ||
| 4845 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4846 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4847 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4848 | +double __ovld atomic_load_explicit(volatile atomic_double __global *object, | ||
| 4849 | + memory_order order); | ||
| 4850 | +double __ovld atomic_load_explicit(volatile atomic_double __local *object, | ||
| 4851 | + memory_order order); | ||
| 4852 | +#endif // __opencl_c_atomic_scope_device | ||
| 4853 | +double __ovld atomic_load_explicit(volatile atomic_double __global *object, | ||
| 4854 | + memory_order order, memory_scope scope); | ||
| 4855 | +double __ovld atomic_load_explicit(volatile atomic_double __local *object, | ||
| 4856 | + memory_order order, memory_scope scope); | ||
| 4857 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4858 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4859 | +long __ovld atomic_load_explicit(volatile atomic_long __global *object, | ||
| 4860 | + memory_order order); | ||
| 4861 | +long __ovld atomic_load_explicit(volatile atomic_long __local *object, | ||
| 4862 | + memory_order order); | ||
| 4863 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong __global *object, | ||
| 4864 | + memory_order order); | ||
| 4865 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong __local *object, | ||
| 4866 | + memory_order order); | ||
| 4867 | +#endif // __opencl_c_atomic_scope_device | ||
| 4868 | +long __ovld atomic_load_explicit(volatile atomic_long __global *object, | ||
| 4869 | + memory_order order, memory_scope scope); | ||
| 4870 | +long __ovld atomic_load_explicit(volatile atomic_long __local *object, | ||
| 4871 | + memory_order order, memory_scope scope); | ||
| 4872 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong __global *object, | ||
| 4873 | + memory_order order, memory_scope scope); | ||
| 4874 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong __local *object, | ||
| 4875 | + memory_order order, memory_scope scope); | ||
| 4876 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4877 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4878 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4879 | |||
| 4880 | // atomic_exchange() | ||
| 4881 | - | ||
| 4882 | +#ifdef __opencl_c_generic_address_space | ||
| 4883 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4884 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4885 | int __ovld atomic_exchange(volatile atomic_int *object, int desired); | ||
| 4886 | -int __ovld atomic_exchange_explicit(volatile atomic_int *object, int desired, memory_order order); | ||
| 4887 | -int __ovld atomic_exchange_explicit(volatile atomic_int *object, int desired, memory_order order, memory_scope scope); | ||
| 4888 | uint __ovld atomic_exchange(volatile atomic_uint *object, uint desired); | ||
| 4889 | -uint __ovld atomic_exchange_explicit(volatile atomic_uint *object, uint desired, memory_order order); | ||
| 4890 | -uint __ovld atomic_exchange_explicit(volatile atomic_uint *object, uint desired, memory_order order, memory_scope scope); | ||
| 4891 | float __ovld atomic_exchange(volatile atomic_float *object, float desired); | ||
| 4892 | -float __ovld atomic_exchange_explicit(volatile atomic_float *object, float desired, memory_order order); | ||
| 4893 | -float __ovld atomic_exchange_explicit(volatile atomic_float *object, float desired, memory_order order, memory_scope scope); | ||
| 4894 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4895 | -#ifdef cl_khr_fp64 | ||
| 4896 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4897 | double __ovld atomic_exchange(volatile atomic_double *object, double desired); | ||
| 4898 | -double __ovld atomic_exchange_explicit(volatile atomic_double *object, double desired, memory_order order); | ||
| 4899 | -double __ovld atomic_exchange_explicit(volatile atomic_double *object, double desired, memory_order order, memory_scope scope); | ||
| 4900 | -#endif //cl_khr_fp64 | ||
| 4901 | +#endif | ||
| 4902 | long __ovld atomic_exchange(volatile atomic_long *object, long desired); | ||
| 4903 | -long __ovld atomic_exchange_explicit(volatile atomic_long *object, long desired, memory_order order); | ||
| 4904 | -long __ovld atomic_exchange_explicit(volatile atomic_long *object, long desired, memory_order order, memory_scope scope); | ||
| 4905 | ulong __ovld atomic_exchange(volatile atomic_ulong *object, ulong desired); | ||
| 4906 | -ulong __ovld atomic_exchange_explicit(volatile atomic_ulong *object, ulong desired, memory_order order); | ||
| 4907 | -ulong __ovld atomic_exchange_explicit(volatile atomic_ulong *object, ulong desired, memory_order order, memory_scope scope); | ||
| 4908 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4909 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4910 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4911 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4912 | +#endif // __opencl_c_generic_address_space | ||
| 4913 | + | ||
| 4914 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4915 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4916 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4917 | +int __ovld atomic_exchange(volatile atomic_int __global *object, int desired); | ||
| 4918 | +int __ovld atomic_exchange(volatile atomic_int __local *object, int desired); | ||
| 4919 | +uint __ovld atomic_exchange(volatile atomic_uint __global *object, | ||
| 4920 | + uint desired); | ||
| 4921 | +uint __ovld atomic_exchange(volatile atomic_uint __local *object, uint desired); | ||
| 4922 | +float __ovld atomic_exchange(volatile atomic_float __global *object, | ||
| 4923 | + float desired); | ||
| 4924 | +float __ovld atomic_exchange(volatile atomic_float __local *object, | ||
| 4925 | + float desired); | ||
| 4926 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4927 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4928 | +double __ovld atomic_exchange(volatile atomic_double __global *object, | ||
| 4929 | + double desired); | ||
| 4930 | +double __ovld atomic_exchange(volatile atomic_double __local *object, | ||
| 4931 | + double desired); | ||
| 4932 | #endif | ||
| 4933 | +long __ovld atomic_exchange(volatile atomic_long __global *object, | ||
| 4934 | + long desired); | ||
| 4935 | +long __ovld atomic_exchange(volatile atomic_long __local *object, long desired); | ||
| 4936 | +ulong __ovld atomic_exchange(volatile atomic_ulong __global *object, | ||
| 4937 | + ulong desired); | ||
| 4938 | +ulong __ovld atomic_exchange(volatile atomic_ulong __local *object, | ||
| 4939 | + ulong desired); | ||
| 4940 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4941 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4942 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4943 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4944 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4945 | + | ||
| 4946 | +#ifdef __opencl_c_generic_address_space | ||
| 4947 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4948 | +int __ovld atomic_exchange_explicit(volatile atomic_int *object, int desired, | ||
| 4949 | + memory_order order); | ||
| 4950 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint *object, uint desired, | ||
| 4951 | + memory_order order); | ||
| 4952 | +float __ovld atomic_exchange_explicit(volatile atomic_float *object, | ||
| 4953 | + float desired, memory_order order); | ||
| 4954 | +#endif // __opencl_c_atomic_scope_device | ||
| 4955 | +int __ovld atomic_exchange_explicit(volatile atomic_int *object, int desired, | ||
| 4956 | + memory_order order, memory_scope scope); | ||
| 4957 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint *object, uint desired, | ||
| 4958 | + memory_order order, memory_scope scope); | ||
| 4959 | +float __ovld atomic_exchange_explicit(volatile atomic_float *object, | ||
| 4960 | + float desired, memory_order order, | ||
| 4961 | + memory_scope scope); | ||
| 4962 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4963 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4964 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4965 | +double __ovld atomic_exchange_explicit(volatile atomic_double *object, | ||
| 4966 | + double desired, memory_order order); | ||
| 4967 | +#endif // __opencl_c_atomic_scope_device | ||
| 4968 | +double __ovld atomic_exchange_explicit(volatile atomic_double *object, | ||
| 4969 | + double desired, memory_order order, | ||
| 4970 | + memory_scope scope); | ||
| 4971 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4972 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4973 | +long __ovld atomic_exchange_explicit(volatile atomic_long *object, long desired, | ||
| 4974 | + memory_order order); | ||
| 4975 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong *object, | ||
| 4976 | + ulong desired, memory_order order); | ||
| 4977 | +#endif // __opencl_c_atomic_scope_device | ||
| 4978 | +long __ovld atomic_exchange_explicit(volatile atomic_long *object, long desired, | ||
| 4979 | + memory_order order, memory_scope scope); | ||
| 4980 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong *object, | ||
| 4981 | + ulong desired, memory_order order, | ||
| 4982 | + memory_scope scope); | ||
| 4983 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4984 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4985 | +#endif // __opencl_c_generic_address_space | ||
| 4986 | + | ||
| 4987 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4988 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4989 | +int __ovld atomic_exchange_explicit(volatile atomic_int __global *object, | ||
| 4990 | + int desired, memory_order order); | ||
| 4991 | +int __ovld atomic_exchange_explicit(volatile atomic_int __local *object, | ||
| 4992 | + int desired, memory_order order); | ||
| 4993 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint __global *object, | ||
| 4994 | + uint desired, memory_order order); | ||
| 4995 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint __local *object, | ||
| 4996 | + uint desired, memory_order order); | ||
| 4997 | +float __ovld atomic_exchange_explicit(volatile atomic_float __global *object, | ||
| 4998 | + float desired, memory_order order); | ||
| 4999 | +float __ovld atomic_exchange_explicit(volatile atomic_float __local *object, | ||
| 5000 | + float desired, memory_order order); | ||
| 5001 | +#endif // __opencl_c_atomic_scope_device | ||
| 5002 | +int __ovld atomic_exchange_explicit(volatile atomic_int __global *object, | ||
| 5003 | + int desired, memory_order order, | ||
| 5004 | + memory_scope scope); | ||
| 5005 | +int __ovld atomic_exchange_explicit(volatile atomic_int __local *object, | ||
| 5006 | + int desired, memory_order order, | ||
| 5007 | + memory_scope scope); | ||
| 5008 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint __global *object, | ||
| 5009 | + uint desired, memory_order order, | ||
| 5010 | + memory_scope scope); | ||
| 5011 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint __local *object, | ||
| 5012 | + uint desired, memory_order order, | ||
| 5013 | + memory_scope scope); | ||
| 5014 | +float __ovld atomic_exchange_explicit(volatile atomic_float __global *object, | ||
| 5015 | + float desired, memory_order order, | ||
| 5016 | + memory_scope scope); | ||
| 5017 | +float __ovld atomic_exchange_explicit(volatile atomic_float __local *object, | ||
| 5018 | + float desired, memory_order order, | ||
| 5019 | + memory_scope scope); | ||
| 5020 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5021 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5022 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5023 | +double __ovld atomic_exchange_explicit(volatile atomic_double __global *object, | ||
| 5024 | + double desired, memory_order order); | ||
| 5025 | +double __ovld atomic_exchange_explicit(volatile atomic_double __local *object, | ||
| 5026 | + double desired, memory_order order); | ||
| 5027 | +#endif // __opencl_c_atomic_scope_device | ||
| 5028 | +double __ovld atomic_exchange_explicit(volatile atomic_double __global *object, | ||
| 5029 | + double desired, memory_order order, | ||
| 5030 | + memory_scope scope); | ||
| 5031 | +double __ovld atomic_exchange_explicit(volatile atomic_double __local *object, | ||
| 5032 | + double desired, memory_order order, | ||
| 5033 | + memory_scope scope); | ||
| 5034 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5035 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5036 | +long __ovld atomic_exchange_explicit(volatile atomic_long __global *object, | ||
| 5037 | + long desired, memory_order order); | ||
| 5038 | +long __ovld atomic_exchange_explicit(volatile atomic_long __local *object, | ||
| 5039 | + long desired, memory_order order); | ||
| 5040 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong __global *object, | ||
| 5041 | + ulong desired, memory_order order); | ||
| 5042 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong __local *object, | ||
| 5043 | + ulong desired, memory_order order); | ||
| 5044 | +#endif // __opencl_c_atomic_scope_device | ||
| 5045 | +long __ovld atomic_exchange_explicit(volatile atomic_long __global *object, | ||
| 5046 | + long desired, memory_order order, | ||
| 5047 | + memory_scope scope); | ||
| 5048 | +long __ovld atomic_exchange_explicit(volatile atomic_long __local *object, | ||
| 5049 | + long desired, memory_order order, | ||
| 5050 | + memory_scope scope); | ||
| 5051 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong __global *object, | ||
| 5052 | + ulong desired, memory_order order, | ||
| 5053 | + memory_scope scope); | ||
| 5054 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong __local *object, | ||
| 5055 | + ulong desired, memory_order order, | ||
| 5056 | + memory_scope scope); | ||
| 5057 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5058 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5059 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5060 | |||
| 5061 | // atomic_compare_exchange_strong() and atomic_compare_exchange_weak() | ||
| 5062 | - | ||
| 5063 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_int *object, int *expected, int desired); | ||
| 5064 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_int *object, int *expected, | ||
| 5065 | - int desired, memory_order success, memory_order failure); | ||
| 5066 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_int *object, int *expected, | ||
| 5067 | - int desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5068 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_uint *object, uint *expected, uint desired); | ||
| 5069 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_uint *object, uint *expected, | ||
| 5070 | - uint desired, memory_order success, memory_order failure); | ||
| 5071 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_uint *object, uint *expected, | ||
| 5072 | - uint desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5073 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_int *object, int *expected, int desired); | ||
| 5074 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_int *object, int *expected, | ||
| 5075 | - int desired, memory_order success, memory_order failure); | ||
| 5076 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_int *object, int *expected, | ||
| 5077 | - int desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5078 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_uint *object, uint *expected, uint desired); | ||
| 5079 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_uint *object, uint *expected, | ||
| 5080 | - uint desired, memory_order success, memory_order failure); | ||
| 5081 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_uint *object, uint *expected, | ||
| 5082 | - uint desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5083 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_float *object, float *expected, float desired); | ||
| 5084 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_float *object, float *expected, | ||
| 5085 | - float desired, memory_order success, memory_order failure); | ||
| 5086 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_float *object, float *expected, | ||
| 5087 | - float desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5088 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_float *object, float *expected, float desired); | ||
| 5089 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_float *object, float *expected, | ||
| 5090 | - float desired, memory_order success, memory_order failure); | ||
| 5091 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_float *object, float *expected, | ||
| 5092 | - float desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5093 | +#ifdef __opencl_c_generic_address_space | ||
| 5094 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 5095 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 5096 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int *object, | ||
| 5097 | + int *expected, int desired); | ||
| 5098 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_uint *object, | ||
| 5099 | + uint *expected, uint desired); | ||
| 5100 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int *object, | ||
| 5101 | + int *expected, int desired); | ||
| 5102 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint *object, | ||
| 5103 | + uint *expected, uint desired); | ||
| 5104 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_float *object, | ||
| 5105 | + float *expected, float desired); | ||
| 5106 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float *object, | ||
| 5107 | + float *expected, float desired); | ||
| 5108 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5109 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5110 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_double *object, | ||
| 5111 | + double *expected, double desired); | ||
| 5112 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_double *object, | ||
| 5113 | + double *expected, double desired); | ||
| 5114 | +#endif | ||
| 5115 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_long *object, | ||
| 5116 | + long *expected, long desired); | ||
| 5117 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long *object, | ||
| 5118 | + long *expected, long desired); | ||
| 5119 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_ulong *object, | ||
| 5120 | + ulong *expected, ulong desired); | ||
| 5121 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong *object, | ||
| 5122 | + ulong *expected, ulong desired); | ||
| 5123 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5124 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5125 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 5126 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 5127 | +#endif // __opencl_c_generic_address_space | ||
| 5128 | + | ||
| 5129 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5130 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 5131 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 5132 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __global *object, | ||
| 5133 | + int __global *expected, int desired); | ||
| 5134 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __local *object, | ||
| 5135 | + int __global *expected, int desired); | ||
| 5136 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __global *object, | ||
| 5137 | + int __local *expected, int desired); | ||
| 5138 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __local *object, | ||
| 5139 | + int __local *expected, int desired); | ||
| 5140 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __global *object, | ||
| 5141 | + int __private *expected, | ||
| 5142 | + int desired); | ||
| 5143 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __local *object, | ||
| 5144 | + int __private *expected, | ||
| 5145 | + int desired); | ||
| 5146 | +bool __ovld | ||
| 5147 | +atomic_compare_exchange_strong(volatile atomic_uint __global *object, | ||
| 5148 | + uint __global *expected, uint desired); | ||
| 5149 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_uint __local *object, | ||
| 5150 | + uint __global *expected, | ||
| 5151 | + uint desired); | ||
| 5152 | +bool __ovld | ||
| 5153 | +atomic_compare_exchange_strong(volatile atomic_uint __global *object, | ||
| 5154 | + uint __local *expected, uint desired); | ||
| 5155 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_uint __local *object, | ||
| 5156 | + uint __local *expected, | ||
| 5157 | + uint desired); | ||
| 5158 | +bool __ovld | ||
| 5159 | +atomic_compare_exchange_strong(volatile atomic_uint __global *object, | ||
| 5160 | + uint __private *expected, uint desired); | ||
| 5161 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_uint __local *object, | ||
| 5162 | + uint __private *expected, | ||
| 5163 | + uint desired); | ||
| 5164 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __global *object, | ||
| 5165 | + int __global *expected, int desired); | ||
| 5166 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __local *object, | ||
| 5167 | + int __global *expected, int desired); | ||
| 5168 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __global *object, | ||
| 5169 | + int __local *expected, int desired); | ||
| 5170 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __local *object, | ||
| 5171 | + int __local *expected, int desired); | ||
| 5172 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __global *object, | ||
| 5173 | + int __private *expected, int desired); | ||
| 5174 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __local *object, | ||
| 5175 | + int __private *expected, int desired); | ||
| 5176 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __global *object, | ||
| 5177 | + uint __global *expected, uint desired); | ||
| 5178 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __local *object, | ||
| 5179 | + uint __global *expected, uint desired); | ||
| 5180 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __global *object, | ||
| 5181 | + uint __local *expected, uint desired); | ||
| 5182 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __local *object, | ||
| 5183 | + uint __local *expected, uint desired); | ||
| 5184 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __global *object, | ||
| 5185 | + uint __private *expected, | ||
| 5186 | + uint desired); | ||
| 5187 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __local *object, | ||
| 5188 | + uint __private *expected, | ||
| 5189 | + uint desired); | ||
| 5190 | +bool __ovld | ||
| 5191 | +atomic_compare_exchange_strong(volatile atomic_float __global *object, | ||
| 5192 | + float __global *expected, float desired); | ||
| 5193 | +bool __ovld | ||
| 5194 | +atomic_compare_exchange_strong(volatile atomic_float __local *object, | ||
| 5195 | + float __global *expected, float desired); | ||
| 5196 | +bool __ovld | ||
| 5197 | +atomic_compare_exchange_strong(volatile atomic_float __global *object, | ||
| 5198 | + float __local *expected, float desired); | ||
| 5199 | +bool __ovld | ||
| 5200 | +atomic_compare_exchange_strong(volatile atomic_float __local *object, | ||
| 5201 | + float __local *expected, float desired); | ||
| 5202 | +bool __ovld | ||
| 5203 | +atomic_compare_exchange_strong(volatile atomic_float __global *object, | ||
| 5204 | + float __private *expected, float desired); | ||
| 5205 | +bool __ovld | ||
| 5206 | +atomic_compare_exchange_strong(volatile atomic_float __local *object, | ||
| 5207 | + float __private *expected, float desired); | ||
| 5208 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __global *object, | ||
| 5209 | + float __global *expected, | ||
| 5210 | + float desired); | ||
| 5211 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __local *object, | ||
| 5212 | + float __global *expected, | ||
| 5213 | + float desired); | ||
| 5214 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __global *object, | ||
| 5215 | + float __local *expected, | ||
| 5216 | + float desired); | ||
| 5217 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __local *object, | ||
| 5218 | + float __local *expected, | ||
| 5219 | + float desired); | ||
| 5220 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __global *object, | ||
| 5221 | + float __private *expected, | ||
| 5222 | + float desired); | ||
| 5223 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __local *object, | ||
| 5224 | + float __private *expected, | ||
| 5225 | + float desired); | ||
| 5226 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5227 | -#ifdef cl_khr_fp64 | ||
| 5228 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_double *object, double *expected, double desired); | ||
| 5229 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_double *object, double *expected, | ||
| 5230 | - double desired, memory_order success, memory_order failure); | ||
| 5231 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_double *object, double *expected, | ||
| 5232 | - double desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5233 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_double *object, double *expected, double desired); | ||
| 5234 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_double *object, double *expected, | ||
| 5235 | - double desired, memory_order success, memory_order failure); | ||
| 5236 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_double *object, double *expected, | ||
| 5237 | - double desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5238 | -#endif //cl_khr_fp64 | ||
| 5239 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_long *object, long *expected, long desired); | ||
| 5240 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_long *object, long *expected, | ||
| 5241 | - long desired, memory_order success, memory_order failure); | ||
| 5242 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_long *object, long *expected, | ||
| 5243 | - long desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5244 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_long *object, long *expected, long desired); | ||
| 5245 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_long *object, long *expected, | ||
| 5246 | - long desired, memory_order success, memory_order failure); | ||
| 5247 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_long *object, long *expected, | ||
| 5248 | - long desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5249 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_ulong *object, ulong *expected, ulong desired); | ||
| 5250 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_ulong *object, ulong *expected, | ||
| 5251 | - ulong desired, memory_order success, memory_order failure); | ||
| 5252 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_ulong *object, ulong *expected, | ||
| 5253 | - ulong desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5254 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong *object, ulong *expected, ulong desired); | ||
| 5255 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_ulong *object, ulong *expected, | ||
| 5256 | - ulong desired, memory_order success, memory_order failure); | ||
| 5257 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_ulong *object, ulong *expected, | ||
| 5258 | - ulong desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5259 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5260 | +bool __ovld | ||
| 5261 | +atomic_compare_exchange_strong(volatile atomic_double __global *object, | ||
| 5262 | + double __global *expected, double desired); | ||
| 5263 | +bool __ovld | ||
| 5264 | +atomic_compare_exchange_strong(volatile atomic_double __local *object, | ||
| 5265 | + double __global *expected, double desired); | ||
| 5266 | +bool __ovld | ||
| 5267 | +atomic_compare_exchange_strong(volatile atomic_double __global *object, | ||
| 5268 | + double __local *expected, double desired); | ||
| 5269 | +bool __ovld | ||
| 5270 | +atomic_compare_exchange_strong(volatile atomic_double __local *object, | ||
| 5271 | + double __local *expected, double desired); | ||
| 5272 | +bool __ovld | ||
| 5273 | +atomic_compare_exchange_strong(volatile atomic_double __global *object, | ||
| 5274 | + double __private *expected, double desired); | ||
| 5275 | +bool __ovld | ||
| 5276 | +atomic_compare_exchange_strong(volatile atomic_double __local *object, | ||
| 5277 | + double __private *expected, double desired); | ||
| 5278 | +bool __ovld | ||
| 5279 | +atomic_compare_exchange_weak(volatile atomic_double __global *object, | ||
| 5280 | + double __global *expected, double desired); | ||
| 5281 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_double __local *object, | ||
| 5282 | + double __global *expected, | ||
| 5283 | + double desired); | ||
| 5284 | +bool __ovld | ||
| 5285 | +atomic_compare_exchange_weak(volatile atomic_double __global *object, | ||
| 5286 | + double __local *expected, double desired); | ||
| 5287 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_double __local *object, | ||
| 5288 | + double __local *expected, | ||
| 5289 | + double desired); | ||
| 5290 | +bool __ovld | ||
| 5291 | +atomic_compare_exchange_weak(volatile atomic_double __global *object, | ||
| 5292 | + double __private *expected, double desired); | ||
| 5293 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_double __local *object, | ||
| 5294 | + double __private *expected, | ||
| 5295 | + double desired); | ||
| 5296 | #endif | ||
| 5297 | +bool __ovld | ||
| 5298 | +atomic_compare_exchange_strong(volatile atomic_long __global *object, | ||
| 5299 | + long __global *expected, long desired); | ||
| 5300 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_long __local *object, | ||
| 5301 | + long __global *expected, | ||
| 5302 | + long desired); | ||
| 5303 | +bool __ovld | ||
| 5304 | +atomic_compare_exchange_strong(volatile atomic_long __global *object, | ||
| 5305 | + long __local *expected, long desired); | ||
| 5306 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_long __local *object, | ||
| 5307 | + long __local *expected, | ||
| 5308 | + long desired); | ||
| 5309 | +bool __ovld | ||
| 5310 | +atomic_compare_exchange_strong(volatile atomic_long __global *object, | ||
| 5311 | + long __private *expected, long desired); | ||
| 5312 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_long __local *object, | ||
| 5313 | + long __private *expected, | ||
| 5314 | + long desired); | ||
| 5315 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __global *object, | ||
| 5316 | + long __global *expected, long desired); | ||
| 5317 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __local *object, | ||
| 5318 | + long __global *expected, long desired); | ||
| 5319 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __global *object, | ||
| 5320 | + long __local *expected, long desired); | ||
| 5321 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __local *object, | ||
| 5322 | + long __local *expected, long desired); | ||
| 5323 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __global *object, | ||
| 5324 | + long __private *expected, | ||
| 5325 | + long desired); | ||
| 5326 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __local *object, | ||
| 5327 | + long __private *expected, | ||
| 5328 | + long desired); | ||
| 5329 | +bool __ovld | ||
| 5330 | +atomic_compare_exchange_strong(volatile atomic_ulong __global *object, | ||
| 5331 | + ulong __global *expected, ulong desired); | ||
| 5332 | +bool __ovld | ||
| 5333 | +atomic_compare_exchange_strong(volatile atomic_ulong __local *object, | ||
| 5334 | + ulong __global *expected, ulong desired); | ||
| 5335 | +bool __ovld | ||
| 5336 | +atomic_compare_exchange_strong(volatile atomic_ulong __global *object, | ||
| 5337 | + ulong __local *expected, ulong desired); | ||
| 5338 | +bool __ovld | ||
| 5339 | +atomic_compare_exchange_strong(volatile atomic_ulong __local *object, | ||
| 5340 | + ulong __local *expected, ulong desired); | ||
| 5341 | +bool __ovld | ||
| 5342 | +atomic_compare_exchange_strong(volatile atomic_ulong __global *object, | ||
| 5343 | + ulong __private *expected, ulong desired); | ||
| 5344 | +bool __ovld | ||
| 5345 | +atomic_compare_exchange_strong(volatile atomic_ulong __local *object, | ||
| 5346 | + ulong __private *expected, ulong desired); | ||
| 5347 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __global *object, | ||
| 5348 | + ulong __global *expected, | ||
| 5349 | + ulong desired); | ||
| 5350 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __local *object, | ||
| 5351 | + ulong __global *expected, | ||
| 5352 | + ulong desired); | ||
| 5353 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __global *object, | ||
| 5354 | + ulong __local *expected, | ||
| 5355 | + ulong desired); | ||
| 5356 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __local *object, | ||
| 5357 | + ulong __local *expected, | ||
| 5358 | + ulong desired); | ||
| 5359 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __global *object, | ||
| 5360 | + ulong __private *expected, | ||
| 5361 | + ulong desired); | ||
| 5362 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __local *object, | ||
| 5363 | + ulong __private *expected, | ||
| 5364 | + ulong desired); | ||
| 5365 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5366 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5367 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 5368 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 5369 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5370 | + | ||
| 5371 | +#ifdef __opencl_c_generic_address_space | ||
| 5372 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5373 | +bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_int *object, | ||
| 5374 | + int *expected, int desired, | ||
| 5375 | + memory_order success, | ||
| 5376 | + memory_order failure); | ||
| 5377 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5378 | + volatile atomic_uint *object, uint *expected, uint desired, | ||
| 5379 | + memory_order success, memory_order failure); | ||
| 5380 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_int *object, | ||
| 5381 | + int *expected, int desired, | ||
| 5382 | + memory_order success, | ||
| 5383 | + memory_order failure); | ||
| 5384 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_uint *object, | ||
| 5385 | + uint *expected, uint desired, | ||
| 5386 | + memory_order success, | ||
| 5387 | + memory_order failure); | ||
| 5388 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5389 | + volatile atomic_float *object, float *expected, float desired, | ||
| 5390 | + memory_order success, memory_order failure); | ||
| 5391 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_float *object, | ||
| 5392 | + float *expected, | ||
| 5393 | + float desired, | ||
| 5394 | + memory_order success, | ||
| 5395 | + memory_order failure); | ||
| 5396 | +#endif // __opencl_c_atomic_scope_device | ||
| 5397 | +bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_int *object, | ||
| 5398 | + int *expected, int desired, | ||
| 5399 | + memory_order success, | ||
| 5400 | + memory_order failure, | ||
| 5401 | + memory_scope scope); | ||
| 5402 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5403 | + volatile atomic_uint *object, uint *expected, uint desired, | ||
| 5404 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5405 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_int *object, | ||
| 5406 | + int *expected, int desired, | ||
| 5407 | + memory_order success, | ||
| 5408 | + memory_order failure, | ||
| 5409 | + memory_scope scope); | ||
| 5410 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_uint *object, | ||
| 5411 | + uint *expected, uint desired, | ||
| 5412 | + memory_order success, | ||
| 5413 | + memory_order failure, | ||
| 5414 | + memory_scope scope); | ||
| 5415 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5416 | + volatile atomic_float *object, float *expected, float desired, | ||
| 5417 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5418 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5419 | + volatile atomic_float *object, float *expected, float desired, | ||
| 5420 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5421 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5422 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5423 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5424 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5425 | + volatile atomic_double *object, double *expected, double desired, | ||
| 5426 | + memory_order success, memory_order failure); | ||
| 5427 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5428 | + volatile atomic_double *object, double *expected, double desired, | ||
| 5429 | + memory_order success, memory_order failure); | ||
| 5430 | +#endif // __opencl_c_atomic_scope_device | ||
| 5431 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5432 | + volatile atomic_double *object, double *expected, double desired, | ||
| 5433 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5434 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5435 | + volatile atomic_double *object, double *expected, double desired, | ||
| 5436 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5437 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5438 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5439 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5440 | + volatile atomic_long *object, long *expected, long desired, | ||
| 5441 | + memory_order success, memory_order failure); | ||
| 5442 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_long *object, | ||
| 5443 | + long *expected, long desired, | ||
| 5444 | + memory_order success, | ||
| 5445 | + memory_order failure); | ||
| 5446 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5447 | + volatile atomic_ulong *object, ulong *expected, ulong desired, | ||
| 5448 | + memory_order success, memory_order failure); | ||
| 5449 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_ulong *object, | ||
| 5450 | + ulong *expected, | ||
| 5451 | + ulong desired, | ||
| 5452 | + memory_order success, | ||
| 5453 | + memory_order failure); | ||
| 5454 | +#endif // __opencl_c_atomic_scope_device | ||
| 5455 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5456 | + volatile atomic_long *object, long *expected, long desired, | ||
| 5457 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5458 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_long *object, | ||
| 5459 | + long *expected, long desired, | ||
| 5460 | + memory_order success, | ||
| 5461 | + memory_order failure, | ||
| 5462 | + memory_scope scope); | ||
| 5463 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5464 | + volatile atomic_ulong *object, ulong *expected, ulong desired, | ||
| 5465 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5466 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5467 | + volatile atomic_ulong *object, ulong *expected, ulong desired, | ||
| 5468 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5469 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5470 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5471 | +#endif // __opencl_c_generic_address_space | ||
| 5472 | + | ||
| 5473 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5474 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5475 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5476 | + volatile atomic_int __global *object, int __global *expected, int desired, | ||
| 5477 | + memory_order success, memory_order failure); | ||
| 5478 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5479 | + volatile atomic_int __local *object, int __global *expected, int desired, | ||
| 5480 | + memory_order success, memory_order failure); | ||
| 5481 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5482 | + volatile atomic_int __global *object, int __local *expected, int desired, | ||
| 5483 | + memory_order success, memory_order failure); | ||
| 5484 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5485 | + volatile atomic_int __local *object, int __local *expected, int desired, | ||
| 5486 | + memory_order success, memory_order failure); | ||
| 5487 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5488 | + volatile atomic_int __global *object, int __private *expected, int desired, | ||
| 5489 | + memory_order success, memory_order failure); | ||
| 5490 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5491 | + volatile atomic_int __local *object, int __private *expected, int desired, | ||
| 5492 | + memory_order success, memory_order failure); | ||
| 5493 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5494 | + volatile atomic_uint __global *object, uint __global *expected, | ||
| 5495 | + uint desired, memory_order success, memory_order failure); | ||
| 5496 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5497 | + volatile atomic_uint __local *object, uint __global *expected, uint desired, | ||
| 5498 | + memory_order success, memory_order failure); | ||
| 5499 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5500 | + volatile atomic_uint __global *object, uint __local *expected, uint desired, | ||
| 5501 | + memory_order success, memory_order failure); | ||
| 5502 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5503 | + volatile atomic_uint __local *object, uint __local *expected, uint desired, | ||
| 5504 | + memory_order success, memory_order failure); | ||
| 5505 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5506 | + volatile atomic_uint __global *object, uint __private *expected, | ||
| 5507 | + uint desired, memory_order success, memory_order failure); | ||
| 5508 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5509 | + volatile atomic_uint __local *object, uint __private *expected, | ||
| 5510 | + uint desired, memory_order success, memory_order failure); | ||
| 5511 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5512 | + volatile atomic_int __global *object, int __global *expected, int desired, | ||
| 5513 | + memory_order success, memory_order failure); | ||
| 5514 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5515 | + volatile atomic_int __local *object, int __global *expected, int desired, | ||
| 5516 | + memory_order success, memory_order failure); | ||
| 5517 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5518 | + volatile atomic_int __global *object, int __local *expected, int desired, | ||
| 5519 | + memory_order success, memory_order failure); | ||
| 5520 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5521 | + volatile atomic_int __local *object, int __local *expected, int desired, | ||
| 5522 | + memory_order success, memory_order failure); | ||
| 5523 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5524 | + volatile atomic_int __global *object, int __private *expected, int desired, | ||
| 5525 | + memory_order success, memory_order failure); | ||
| 5526 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5527 | + volatile atomic_int __local *object, int __private *expected, int desired, | ||
| 5528 | + memory_order success, memory_order failure); | ||
| 5529 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5530 | + volatile atomic_uint __global *object, uint __global *expected, | ||
| 5531 | + uint desired, memory_order success, memory_order failure); | ||
| 5532 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5533 | + volatile atomic_uint __local *object, uint __global *expected, uint desired, | ||
| 5534 | + memory_order success, memory_order failure); | ||
| 5535 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5536 | + volatile atomic_uint __global *object, uint __local *expected, uint desired, | ||
| 5537 | + memory_order success, memory_order failure); | ||
| 5538 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5539 | + volatile atomic_uint __local *object, uint __local *expected, uint desired, | ||
| 5540 | + memory_order success, memory_order failure); | ||
| 5541 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5542 | + volatile atomic_uint __global *object, uint __private *expected, | ||
| 5543 | + uint desired, memory_order success, memory_order failure); | ||
| 5544 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5545 | + volatile atomic_uint __local *object, uint __private *expected, | ||
| 5546 | + uint desired, memory_order success, memory_order failure); | ||
| 5547 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5548 | + volatile atomic_float __global *object, float __global *expected, | ||
| 5549 | + float desired, memory_order success, memory_order failure); | ||
| 5550 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5551 | + volatile atomic_float __local *object, float __global *expected, | ||
| 5552 | + float desired, memory_order success, memory_order failure); | ||
| 5553 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5554 | + volatile atomic_float __global *object, float __local *expected, | ||
| 5555 | + float desired, memory_order success, memory_order failure); | ||
| 5556 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5557 | + volatile atomic_float __local *object, float __local *expected, | ||
| 5558 | + float desired, memory_order success, memory_order failure); | ||
| 5559 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5560 | + volatile atomic_float __global *object, float __private *expected, | ||
| 5561 | + float desired, memory_order success, memory_order failure); | ||
| 5562 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5563 | + volatile atomic_float __local *object, float __private *expected, | ||
| 5564 | + float desired, memory_order success, memory_order failure); | ||
| 5565 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5566 | + volatile atomic_float __global *object, float __global *expected, | ||
| 5567 | + float desired, memory_order success, memory_order failure); | ||
| 5568 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5569 | + volatile atomic_float __local *object, float __global *expected, | ||
| 5570 | + float desired, memory_order success, memory_order failure); | ||
| 5571 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5572 | + volatile atomic_float __global *object, float __local *expected, | ||
| 5573 | + float desired, memory_order success, memory_order failure); | ||
| 5574 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5575 | + volatile atomic_float __local *object, float __local *expected, | ||
| 5576 | + float desired, memory_order success, memory_order failure); | ||
| 5577 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5578 | + volatile atomic_float __global *object, float __private *expected, | ||
| 5579 | + float desired, memory_order success, memory_order failure); | ||
| 5580 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5581 | + volatile atomic_float __local *object, float __private *expected, | ||
| 5582 | + float desired, memory_order success, memory_order failure); | ||
| 5583 | +#endif // __opencl_c_atomic_scope_device | ||
| 5584 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5585 | + volatile atomic_int __global *object, int __global *expected, int desired, | ||
| 5586 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5587 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5588 | + volatile atomic_int __local *object, int __global *expected, int desired, | ||
| 5589 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5590 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5591 | + volatile atomic_int __global *object, int __local *expected, int desired, | ||
| 5592 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5593 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5594 | + volatile atomic_int __local *object, int __local *expected, int desired, | ||
| 5595 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5596 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5597 | + volatile atomic_int __global *object, int __private *expected, int desired, | ||
| 5598 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5599 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5600 | + volatile atomic_int __local *object, int __private *expected, int desired, | ||
| 5601 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5602 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5603 | + volatile atomic_uint __global *object, uint __global *expected, | ||
| 5604 | + uint desired, memory_order success, memory_order failure, | ||
| 5605 | + memory_scope scope); | ||
| 5606 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5607 | + volatile atomic_uint __local *object, uint __global *expected, uint desired, | ||
| 5608 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5609 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5610 | + volatile atomic_uint __global *object, uint __local *expected, uint desired, | ||
| 5611 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5612 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5613 | + volatile atomic_uint __local *object, uint __local *expected, uint desired, | ||
| 5614 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5615 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5616 | + volatile atomic_uint __global *object, uint __private *expected, | ||
| 5617 | + uint desired, memory_order success, memory_order failure, | ||
| 5618 | + memory_scope scope); | ||
| 5619 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5620 | + volatile atomic_uint __local *object, uint __private *expected, | ||
| 5621 | + uint desired, memory_order success, memory_order failure, | ||
| 5622 | + memory_scope scope); | ||
| 5623 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5624 | + volatile atomic_int __global *object, int __global *expected, int desired, | ||
| 5625 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5626 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5627 | + volatile atomic_int __local *object, int __global *expected, int desired, | ||
| 5628 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5629 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5630 | + volatile atomic_int __global *object, int __local *expected, int desired, | ||
| 5631 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5632 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5633 | + volatile atomic_int __local *object, int __local *expected, int desired, | ||
| 5634 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5635 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5636 | + volatile atomic_int __global *object, int __private *expected, int desired, | ||
| 5637 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5638 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5639 | + volatile atomic_int __local *object, int __private *expected, int desired, | ||
| 5640 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5641 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5642 | + volatile atomic_uint __global *object, uint __global *expected, | ||
| 5643 | + uint desired, memory_order success, memory_order failure, | ||
| 5644 | + memory_scope scope); | ||
| 5645 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5646 | + volatile atomic_uint __local *object, uint __global *expected, uint desired, | ||
| 5647 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5648 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5649 | + volatile atomic_uint __global *object, uint __local *expected, uint desired, | ||
| 5650 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5651 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5652 | + volatile atomic_uint __local *object, uint __local *expected, uint desired, | ||
| 5653 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5654 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5655 | + volatile atomic_uint __global *object, uint __private *expected, | ||
| 5656 | + uint desired, memory_order success, memory_order failure, | ||
| 5657 | + memory_scope scope); | ||
| 5658 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5659 | + volatile atomic_uint __local *object, uint __private *expected, | ||
| 5660 | + uint desired, memory_order success, memory_order failure, | ||
| 5661 | + memory_scope scope); | ||
| 5662 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5663 | + volatile atomic_float __global *object, float __global *expected, | ||
| 5664 | + float desired, memory_order success, memory_order failure, | ||
| 5665 | + memory_scope scope); | ||
| 5666 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5667 | + volatile atomic_float __local *object, float __global *expected, | ||
| 5668 | + float desired, memory_order success, memory_order failure, | ||
| 5669 | + memory_scope scope); | ||
| 5670 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5671 | + volatile atomic_float __global *object, float __local *expected, | ||
| 5672 | + float desired, memory_order success, memory_order failure, | ||
| 5673 | + memory_scope scope); | ||
| 5674 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5675 | + volatile atomic_float __local *object, float __local *expected, | ||
| 5676 | + float desired, memory_order success, memory_order failure, | ||
| 5677 | + memory_scope scope); | ||
| 5678 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5679 | + volatile atomic_float __global *object, float __private *expected, | ||
| 5680 | + float desired, memory_order success, memory_order failure, | ||
| 5681 | + memory_scope scope); | ||
| 5682 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5683 | + volatile atomic_float __local *object, float __private *expected, | ||
| 5684 | + float desired, memory_order success, memory_order failure, | ||
| 5685 | + memory_scope scope); | ||
| 5686 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5687 | + volatile atomic_float __global *object, float __global *expected, | ||
| 5688 | + float desired, memory_order success, memory_order failure, | ||
| 5689 | + memory_scope scope); | ||
| 5690 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5691 | + volatile atomic_float __local *object, float __global *expected, | ||
| 5692 | + float desired, memory_order success, memory_order failure, | ||
| 5693 | + memory_scope scope); | ||
| 5694 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5695 | + volatile atomic_float __global *object, float __local *expected, | ||
| 5696 | + float desired, memory_order success, memory_order failure, | ||
| 5697 | + memory_scope scope); | ||
| 5698 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5699 | + volatile atomic_float __local *object, float __local *expected, | ||
| 5700 | + float desired, memory_order success, memory_order failure, | ||
| 5701 | + memory_scope scope); | ||
| 5702 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5703 | + volatile atomic_float __global *object, float __private *expected, | ||
| 5704 | + float desired, memory_order success, memory_order failure, | ||
| 5705 | + memory_scope scope); | ||
| 5706 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5707 | + volatile atomic_float __local *object, float __private *expected, | ||
| 5708 | + float desired, memory_order success, memory_order failure, | ||
| 5709 | + memory_scope scope); | ||
| 5710 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5711 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5712 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5713 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5714 | + volatile atomic_double __global *object, double __global *expected, | ||
| 5715 | + double desired, memory_order success, memory_order failure); | ||
| 5716 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5717 | + volatile atomic_double __local *object, double __global *expected, | ||
| 5718 | + double desired, memory_order success, memory_order failure); | ||
| 5719 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5720 | + volatile atomic_double __global *object, double __local *expected, | ||
| 5721 | + double desired, memory_order success, memory_order failure); | ||
| 5722 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5723 | + volatile atomic_double __local *object, double __local *expected, | ||
| 5724 | + double desired, memory_order success, memory_order failure); | ||
| 5725 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5726 | + volatile atomic_double __global *object, double __private *expected, | ||
| 5727 | + double desired, memory_order success, memory_order failure); | ||
| 5728 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5729 | + volatile atomic_double __local *object, double __private *expected, | ||
| 5730 | + double desired, memory_order success, memory_order failure); | ||
| 5731 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5732 | + volatile atomic_double __global *object, double __global *expected, | ||
| 5733 | + double desired, memory_order success, memory_order failure); | ||
| 5734 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5735 | + volatile atomic_double __local *object, double __global *expected, | ||
| 5736 | + double desired, memory_order success, memory_order failure); | ||
| 5737 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5738 | + volatile atomic_double __global *object, double __local *expected, | ||
| 5739 | + double desired, memory_order success, memory_order failure); | ||
| 5740 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5741 | + volatile atomic_double __local *object, double __local *expected, | ||
| 5742 | + double desired, memory_order success, memory_order failure); | ||
| 5743 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5744 | + volatile atomic_double __global *object, double __private *expected, | ||
| 5745 | + double desired, memory_order success, memory_order failure); | ||
| 5746 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5747 | + volatile atomic_double __local *object, double __private *expected, | ||
| 5748 | + double desired, memory_order success, memory_order failure); | ||
| 5749 | +#endif // __opencl_c_atomic_scope_device | ||
| 5750 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5751 | + volatile atomic_double __global *object, double __global *expected, | ||
| 5752 | + double desired, memory_order success, memory_order failure, | ||
| 5753 | + memory_scope scope); | ||
| 5754 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5755 | + volatile atomic_double __local *object, double __global *expected, | ||
| 5756 | + double desired, memory_order success, memory_order failure, | ||
| 5757 | + memory_scope scope); | ||
| 5758 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5759 | + volatile atomic_double __global *object, double __local *expected, | ||
| 5760 | + double desired, memory_order success, memory_order failure, | ||
| 5761 | + memory_scope scope); | ||
| 5762 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5763 | + volatile atomic_double __local *object, double __local *expected, | ||
| 5764 | + double desired, memory_order success, memory_order failure, | ||
| 5765 | + memory_scope scope); | ||
| 5766 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5767 | + volatile atomic_double __global *object, double __private *expected, | ||
| 5768 | + double desired, memory_order success, memory_order failure, | ||
| 5769 | + memory_scope scope); | ||
| 5770 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5771 | + volatile atomic_double __local *object, double __private *expected, | ||
| 5772 | + double desired, memory_order success, memory_order failure, | ||
| 5773 | + memory_scope scope); | ||
| 5774 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5775 | + volatile atomic_double __global *object, double __global *expected, | ||
| 5776 | + double desired, memory_order success, memory_order failure, | ||
| 5777 | + memory_scope scope); | ||
| 5778 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5779 | + volatile atomic_double __local *object, double __global *expected, | ||
| 5780 | + double desired, memory_order success, memory_order failure, | ||
| 5781 | + memory_scope scope); | ||
| 5782 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5783 | + volatile atomic_double __global *object, double __local *expected, | ||
| 5784 | + double desired, memory_order success, memory_order failure, | ||
| 5785 | + memory_scope scope); | ||
| 5786 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5787 | + volatile atomic_double __local *object, double __local *expected, | ||
| 5788 | + double desired, memory_order success, memory_order failure, | ||
| 5789 | + memory_scope scope); | ||
| 5790 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5791 | + volatile atomic_double __global *object, double __private *expected, | ||
| 5792 | + double desired, memory_order success, memory_order failure, | ||
| 5793 | + memory_scope scope); | ||
| 5794 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5795 | + volatile atomic_double __local *object, double __private *expected, | ||
| 5796 | + double desired, memory_order success, memory_order failure, | ||
| 5797 | + memory_scope scope); | ||
| 5798 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5799 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5800 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5801 | + volatile atomic_long __global *object, long __global *expected, | ||
| 5802 | + long desired, memory_order success, memory_order failure); | ||
| 5803 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5804 | + volatile atomic_long __local *object, long __global *expected, long desired, | ||
| 5805 | + memory_order success, memory_order failure); | ||
| 5806 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5807 | + volatile atomic_long __global *object, long __local *expected, long desired, | ||
| 5808 | + memory_order success, memory_order failure); | ||
| 5809 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5810 | + volatile atomic_long __local *object, long __local *expected, long desired, | ||
| 5811 | + memory_order success, memory_order failure); | ||
| 5812 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5813 | + volatile atomic_long __global *object, long __private *expected, | ||
| 5814 | + long desired, memory_order success, memory_order failure); | ||
| 5815 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5816 | + volatile atomic_long __local *object, long __private *expected, | ||
| 5817 | + long desired, memory_order success, memory_order failure); | ||
| 5818 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5819 | + volatile atomic_long __global *object, long __global *expected, | ||
| 5820 | + long desired, memory_order success, memory_order failure); | ||
| 5821 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5822 | + volatile atomic_long __local *object, long __global *expected, long desired, | ||
| 5823 | + memory_order success, memory_order failure); | ||
| 5824 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5825 | + volatile atomic_long __global *object, long __local *expected, long desired, | ||
| 5826 | + memory_order success, memory_order failure); | ||
| 5827 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5828 | + volatile atomic_long __local *object, long __local *expected, long desired, | ||
| 5829 | + memory_order success, memory_order failure); | ||
| 5830 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5831 | + volatile atomic_long __global *object, long __private *expected, | ||
| 5832 | + long desired, memory_order success, memory_order failure); | ||
| 5833 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5834 | + volatile atomic_long __local *object, long __private *expected, | ||
| 5835 | + long desired, memory_order success, memory_order failure); | ||
| 5836 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5837 | + volatile atomic_ulong __global *object, ulong __global *expected, | ||
| 5838 | + ulong desired, memory_order success, memory_order failure); | ||
| 5839 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5840 | + volatile atomic_ulong __local *object, ulong __global *expected, | ||
| 5841 | + ulong desired, memory_order success, memory_order failure); | ||
| 5842 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5843 | + volatile atomic_ulong __global *object, ulong __local *expected, | ||
| 5844 | + ulong desired, memory_order success, memory_order failure); | ||
| 5845 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5846 | + volatile atomic_ulong __local *object, ulong __local *expected, | ||
| 5847 | + ulong desired, memory_order success, memory_order failure); | ||
| 5848 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5849 | + volatile atomic_ulong __global *object, ulong __private *expected, | ||
| 5850 | + ulong desired, memory_order success, memory_order failure); | ||
| 5851 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5852 | + volatile atomic_ulong __local *object, ulong __private *expected, | ||
| 5853 | + ulong desired, memory_order success, memory_order failure); | ||
| 5854 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5855 | + volatile atomic_ulong __global *object, ulong __global *expected, | ||
| 5856 | + ulong desired, memory_order success, memory_order failure); | ||
| 5857 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5858 | + volatile atomic_ulong __local *object, ulong __global *expected, | ||
| 5859 | + ulong desired, memory_order success, memory_order failure); | ||
| 5860 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5861 | + volatile atomic_ulong __global *object, ulong __local *expected, | ||
| 5862 | + ulong desired, memory_order success, memory_order failure); | ||
| 5863 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5864 | + volatile atomic_ulong __local *object, ulong __local *expected, | ||
| 5865 | + ulong desired, memory_order success, memory_order failure); | ||
| 5866 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5867 | + volatile atomic_ulong __global *object, ulong __private *expected, | ||
| 5868 | + ulong desired, memory_order success, memory_order failure); | ||
| 5869 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5870 | + volatile atomic_ulong __local *object, ulong __private *expected, | ||
| 5871 | + ulong desired, memory_order success, memory_order failure); | ||
| 5872 | +#endif // __opencl_c_atomic_scope_device | ||
| 5873 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5874 | + volatile atomic_long __global *object, long __global *expected, | ||
| 5875 | + long desired, memory_order success, memory_order failure, | ||
| 5876 | + memory_scope scope); | ||
| 5877 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5878 | + volatile atomic_long __local *object, long __global *expected, long desired, | ||
| 5879 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5880 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5881 | + volatile atomic_long __global *object, long __local *expected, long desired, | ||
| 5882 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5883 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5884 | + volatile atomic_long __local *object, long __local *expected, long desired, | ||
| 5885 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5886 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5887 | + volatile atomic_long __global *object, long __private *expected, | ||
| 5888 | + long desired, memory_order success, memory_order failure, | ||
| 5889 | + memory_scope scope); | ||
| 5890 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5891 | + volatile atomic_long __local *object, long __private *expected, | ||
| 5892 | + long desired, memory_order success, memory_order failure, | ||
| 5893 | + memory_scope scope); | ||
| 5894 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5895 | + volatile atomic_long __global *object, long __global *expected, | ||
| 5896 | + long desired, memory_order success, memory_order failure, | ||
| 5897 | + memory_scope scope); | ||
| 5898 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5899 | + volatile atomic_long __local *object, long __global *expected, long desired, | ||
| 5900 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5901 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5902 | + volatile atomic_long __global *object, long __local *expected, long desired, | ||
| 5903 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5904 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5905 | + volatile atomic_long __local *object, long __local *expected, long desired, | ||
| 5906 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5907 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5908 | + volatile atomic_long __global *object, long __private *expected, | ||
| 5909 | + long desired, memory_order success, memory_order failure, | ||
| 5910 | + memory_scope scope); | ||
| 5911 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5912 | + volatile atomic_long __local *object, long __private *expected, | ||
| 5913 | + long desired, memory_order success, memory_order failure, | ||
| 5914 | + memory_scope scope); | ||
| 5915 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5916 | + volatile atomic_ulong __global *object, ulong __global *expected, | ||
| 5917 | + ulong desired, memory_order success, memory_order failure, | ||
| 5918 | + memory_scope scope); | ||
| 5919 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5920 | + volatile atomic_ulong __local *object, ulong __global *expected, | ||
| 5921 | + ulong desired, memory_order success, memory_order failure, | ||
| 5922 | + memory_scope scope); | ||
| 5923 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5924 | + volatile atomic_ulong __global *object, ulong __local *expected, | ||
| 5925 | + ulong desired, memory_order success, memory_order failure, | ||
| 5926 | + memory_scope scope); | ||
| 5927 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5928 | + volatile atomic_ulong __local *object, ulong __local *expected, | ||
| 5929 | + ulong desired, memory_order success, memory_order failure, | ||
| 5930 | + memory_scope scope); | ||
| 5931 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5932 | + volatile atomic_ulong __global *object, ulong __private *expected, | ||
| 5933 | + ulong desired, memory_order success, memory_order failure, | ||
| 5934 | + memory_scope scope); | ||
| 5935 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5936 | + volatile atomic_ulong __local *object, ulong __private *expected, | ||
| 5937 | + ulong desired, memory_order success, memory_order failure, | ||
| 5938 | + memory_scope scope); | ||
| 5939 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5940 | + volatile atomic_ulong __global *object, ulong __global *expected, | ||
| 5941 | + ulong desired, memory_order success, memory_order failure, | ||
| 5942 | + memory_scope scope); | ||
| 5943 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5944 | + volatile atomic_ulong __local *object, ulong __global *expected, | ||
| 5945 | + ulong desired, memory_order success, memory_order failure, | ||
| 5946 | + memory_scope scope); | ||
| 5947 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5948 | + volatile atomic_ulong __global *object, ulong __local *expected, | ||
| 5949 | + ulong desired, memory_order success, memory_order failure, | ||
| 5950 | + memory_scope scope); | ||
| 5951 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5952 | + volatile atomic_ulong __local *object, ulong __local *expected, | ||
| 5953 | + ulong desired, memory_order success, memory_order failure, | ||
| 5954 | + memory_scope scope); | ||
| 5955 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5956 | + volatile atomic_ulong __global *object, ulong __private *expected, | ||
| 5957 | + ulong desired, memory_order success, memory_order failure, | ||
| 5958 | + memory_scope scope); | ||
| 5959 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5960 | + volatile atomic_ulong __local *object, ulong __private *expected, | ||
| 5961 | + ulong desired, memory_order success, memory_order failure, | ||
| 5962 | + memory_scope scope); | ||
| 5963 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5964 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5965 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5966 | |||
| 5967 | // atomic_flag_test_and_set() and atomic_flag_clear() | ||
| 5968 | - | ||
| 5969 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 5970 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 5971 | +#ifdef __opencl_c_generic_address_space | ||
| 5972 | bool __ovld atomic_flag_test_and_set(volatile atomic_flag *object); | ||
| 5973 | -bool __ovld atomic_flag_test_and_set_explicit(volatile atomic_flag *object, memory_order order); | ||
| 5974 | -bool __ovld atomic_flag_test_and_set_explicit(volatile atomic_flag *object, memory_order order, memory_scope scope); | ||
| 5975 | void __ovld atomic_flag_clear(volatile atomic_flag *object); | ||
| 5976 | -void __ovld atomic_flag_clear_explicit(volatile atomic_flag *object, memory_order order); | ||
| 5977 | -void __ovld atomic_flag_clear_explicit(volatile atomic_flag *object, memory_order order, memory_scope scope); | ||
| 5978 | +#endif // __opencl_c_generic_address_space | ||
| 5979 | + | ||
| 5980 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5981 | +bool __ovld atomic_flag_test_and_set(volatile atomic_flag __global *object); | ||
| 5982 | +bool __ovld atomic_flag_test_and_set(volatile atomic_flag __local *object); | ||
| 5983 | +void __ovld atomic_flag_clear(volatile atomic_flag __global *object); | ||
| 5984 | +void __ovld atomic_flag_clear(volatile atomic_flag __local *object); | ||
| 5985 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5986 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 5987 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 5988 | + | ||
| 5989 | +#ifdef __opencl_c_generic_address_space | ||
| 5990 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5991 | +bool __ovld atomic_flag_test_and_set_explicit(volatile atomic_flag *object, | ||
| 5992 | + memory_order order); | ||
| 5993 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag *object, | ||
| 5994 | + memory_order order); | ||
| 5995 | +#endif // __opencl_c_atomic_scope_device | ||
| 5996 | +bool __ovld atomic_flag_test_and_set_explicit(volatile atomic_flag *object, | ||
| 5997 | + memory_order order, | ||
| 5998 | + memory_scope scope); | ||
| 5999 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag *object, | ||
| 6000 | + memory_order order, memory_scope scope); | ||
| 6001 | +#endif // __opencl_c_generic_address_space | ||
| 6002 | + | ||
| 6003 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 6004 | +#ifdef __opencl_c_atomic_scope_device | ||
| 6005 | +bool __ovld atomic_flag_test_and_set_explicit( | ||
| 6006 | + volatile atomic_flag __global *object, memory_order order); | ||
| 6007 | +bool __ovld atomic_flag_test_and_set_explicit( | ||
| 6008 | + volatile atomic_flag __local *object, memory_order order); | ||
| 6009 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag __global *object, | ||
| 6010 | + memory_order order); | ||
| 6011 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag __local *object, | ||
| 6012 | + memory_order order); | ||
| 6013 | +#endif // __opencl_c_atomic_scope_device | ||
| 6014 | +bool __ovld | ||
| 6015 | +atomic_flag_test_and_set_explicit(volatile atomic_flag __global *object, | ||
| 6016 | + memory_order order, memory_scope scope); | ||
| 6017 | +bool __ovld | ||
| 6018 | +atomic_flag_test_and_set_explicit(volatile atomic_flag __local *object, | ||
| 6019 | + memory_order order, memory_scope scope); | ||
| 6020 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag __global *object, | ||
| 6021 | + memory_order order, memory_scope scope); | ||
| 6022 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag __local *object, | ||
| 6023 | + memory_order order, memory_scope scope); | ||
| 6024 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 6025 | |||
| 6026 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6027 | |||
| 6028 | @@ -13918,7 +15943,7 @@ float16 __ovld __cnfn shuffle(float4 x, uint16 mask); | ||
| 6029 | float16 __ovld __cnfn shuffle(float8 x, uint16 mask); | ||
| 6030 | float16 __ovld __cnfn shuffle(float16 x, uint16 mask); | ||
| 6031 | |||
| 6032 | -#ifdef cl_khr_fp64 | ||
| 6033 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6034 | double2 __ovld __cnfn shuffle(double2 x, ulong2 mask); | ||
| 6035 | double2 __ovld __cnfn shuffle(double4 x, ulong2 mask); | ||
| 6036 | double2 __ovld __cnfn shuffle(double8 x, ulong2 mask); | ||
| 6037 | @@ -13938,7 +15963,7 @@ double16 __ovld __cnfn shuffle(double2 x, ulong16 mask); | ||
| 6038 | double16 __ovld __cnfn shuffle(double4 x, ulong16 mask); | ||
| 6039 | double16 __ovld __cnfn shuffle(double8 x, ulong16 mask); | ||
| 6040 | double16 __ovld __cnfn shuffle(double16 x, ulong16 mask); | ||
| 6041 | -#endif //cl_khr_fp64 | ||
| 6042 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6043 | |||
| 6044 | #ifdef cl_khr_fp16 | ||
| 6045 | half2 __ovld __cnfn shuffle(half2 x, ushort2 mask); | ||
| 6046 | @@ -14142,7 +16167,7 @@ float16 __ovld __cnfn shuffle2(float4 x, float4 y, uint16 mask); | ||
| 6047 | float16 __ovld __cnfn shuffle2(float8 x, float8 y, uint16 mask); | ||
| 6048 | float16 __ovld __cnfn shuffle2(float16 x, float16 y, uint16 mask); | ||
| 6049 | |||
| 6050 | -#ifdef cl_khr_fp64 | ||
| 6051 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6052 | double2 __ovld __cnfn shuffle2(double2 x, double2 y, ulong2 mask); | ||
| 6053 | double2 __ovld __cnfn shuffle2(double4 x, double4 y, ulong2 mask); | ||
| 6054 | double2 __ovld __cnfn shuffle2(double8 x, double8 y, ulong2 mask); | ||
| 6055 | @@ -14162,7 +16187,7 @@ double16 __ovld __cnfn shuffle2(double2 x, double2 y, ulong16 mask); | ||
| 6056 | double16 __ovld __cnfn shuffle2(double4 x, double4 y, ulong16 mask); | ||
| 6057 | double16 __ovld __cnfn shuffle2(double8 x, double8 y, ulong16 mask); | ||
| 6058 | double16 __ovld __cnfn shuffle2(double16 x, double16 y, ulong16 mask); | ||
| 6059 | -#endif //cl_khr_fp64 | ||
| 6060 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6061 | |||
| 6062 | #ifdef cl_khr_fp16 | ||
| 6063 | half2 __ovld __cnfn shuffle2(half2 x, half2 y, ushort2 mask); | ||
| 6064 | @@ -14198,6 +16223,7 @@ int printf(__constant const char* st, ...) __attribute__((format(printf, 1, 2))) | ||
| 6065 | #pragma OPENCL EXTENSION cl_khr_gl_msaa_sharing : enable | ||
| 6066 | #endif //cl_khr_gl_msaa_sharing | ||
| 6067 | |||
| 6068 | +#ifdef __opencl_c_images | ||
| 6069 | /** | ||
| 6070 | * Use the coordinate (coord.xy) to do an element lookup in | ||
| 6071 | * the 2D image object specified by image. | ||
| 6072 | @@ -14476,6 +16502,7 @@ half4 __purefn __ovld read_imageh(read_only image1d_buffer_t image, int coord); | ||
| 6073 | |||
| 6074 | // Image read functions for read_write images | ||
| 6075 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6076 | +#ifdef __opencl_c_read_write_images | ||
| 6077 | float4 __purefn __ovld read_imagef(read_write image1d_t image, int coord); | ||
| 6078 | int4 __purefn __ovld read_imagei(read_write image1d_t image, int coord); | ||
| 6079 | uint4 __purefn __ovld read_imageui(read_write image1d_t image, int coord); | ||
| 6080 | @@ -14519,6 +16546,7 @@ float __purefn __ovld read_imagef(read_write image2d_array_msaa_depth_t image, i | ||
| 6081 | #endif //cl_khr_gl_msaa_sharing | ||
| 6082 | |||
| 6083 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6084 | +#ifdef __opencl_c_read_write_images | ||
| 6085 | #ifdef cl_khr_mipmap_image | ||
| 6086 | float4 __purefn __ovld read_imagef(read_write image1d_t image, sampler_t sampler, float coord, float lod); | ||
| 6087 | int4 __purefn __ovld read_imagei(read_write image1d_t image, sampler_t sampler, float coord, float lod); | ||
| 6088 | @@ -14569,6 +16597,7 @@ int4 __purefn __ovld read_imagei(read_write image3d_t image, sampler_t sampler, | ||
| 6089 | uint4 __purefn __ovld read_imageui(read_write image3d_t image, sampler_t sampler, float4 coord, float4 gradientX, float4 gradientY); | ||
| 6090 | |||
| 6091 | #endif //cl_khr_mipmap_image | ||
| 6092 | +#endif //__opencl_c_read_write_images | ||
| 6093 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6094 | |||
| 6095 | // Image read functions returning half4 type | ||
| 6096 | @@ -14580,6 +16609,7 @@ half4 __purefn __ovld read_imageh(read_write image1d_array_t image, int2 coord); | ||
| 6097 | half4 __purefn __ovld read_imageh(read_write image2d_array_t image, int4 coord); | ||
| 6098 | half4 __purefn __ovld read_imageh(read_write image1d_buffer_t image, int coord); | ||
| 6099 | #endif //cl_khr_fp16 | ||
| 6100 | +#endif //__opencl_c_read_write_images | ||
| 6101 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6102 | |||
| 6103 | /** | ||
| 6104 | @@ -14669,7 +16699,7 @@ void __ovld write_imagef(write_only image1d_array_t image_array, int2 coord, flo | ||
| 6105 | void __ovld write_imagei(write_only image1d_array_t image_array, int2 coord, int4 color); | ||
| 6106 | void __ovld write_imageui(write_only image1d_array_t image_array, int2 coord, uint4 color); | ||
| 6107 | |||
| 6108 | -#ifdef cl_khr_3d_image_writes | ||
| 6109 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6110 | void __ovld write_imagef(write_only image3d_t image, int4 coord, float4 color); | ||
| 6111 | void __ovld write_imagei(write_only image3d_t image, int4 coord, int4 color); | ||
| 6112 | void __ovld write_imageui(write_only image3d_t image, int4 coord, uint4 color); | ||
| 6113 | @@ -14702,7 +16732,7 @@ void __ovld write_imageui(write_only image2d_array_t image_array, int4 coord, in | ||
| 6114 | void __ovld write_imagef(write_only image2d_depth_t image, int2 coord, int lod, float depth); | ||
| 6115 | void __ovld write_imagef(write_only image2d_array_depth_t image, int4 coord, int lod, float depth); | ||
| 6116 | |||
| 6117 | -#ifdef cl_khr_3d_image_writes | ||
| 6118 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6119 | void __ovld write_imagef(write_only image3d_t image, int4 coord, int lod, float4 color); | ||
| 6120 | void __ovld write_imagei(write_only image3d_t image, int4 coord, int lod, int4 color); | ||
| 6121 | void __ovld write_imageui(write_only image3d_t image, int4 coord, int lod, uint4 color); | ||
| 6122 | @@ -14715,7 +16745,7 @@ void __ovld write_imageui(write_only image3d_t image, int4 coord, int lod, uint4 | ||
| 6123 | #ifdef cl_khr_fp16 | ||
| 6124 | void __ovld write_imageh(write_only image1d_t image, int coord, half4 color); | ||
| 6125 | void __ovld write_imageh(write_only image2d_t image, int2 coord, half4 color); | ||
| 6126 | -#ifdef cl_khr_3d_image_writes | ||
| 6127 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6128 | void __ovld write_imageh(write_only image3d_t image, int4 coord, half4 color); | ||
| 6129 | #endif | ||
| 6130 | void __ovld write_imageh(write_only image1d_array_t image, int2 coord, half4 color); | ||
| 6131 | @@ -14725,6 +16755,7 @@ void __ovld write_imageh(write_only image1d_buffer_t image, int coord, half4 col | ||
| 6132 | |||
| 6133 | // Image write functions for read_write images | ||
| 6134 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6135 | +#ifdef __opencl_c_read_write_images | ||
| 6136 | void __ovld write_imagef(read_write image2d_t image, int2 coord, float4 color); | ||
| 6137 | void __ovld write_imagei(read_write image2d_t image, int2 coord, int4 color); | ||
| 6138 | void __ovld write_imageui(read_write image2d_t image, int2 coord, uint4 color); | ||
| 6139 | @@ -14745,7 +16776,7 @@ void __ovld write_imagef(read_write image1d_array_t image_array, int2 coord, flo | ||
| 6140 | void __ovld write_imagei(read_write image1d_array_t image_array, int2 coord, int4 color); | ||
| 6141 | void __ovld write_imageui(read_write image1d_array_t image_array, int2 coord, uint4 color); | ||
| 6142 | |||
| 6143 | -#ifdef cl_khr_3d_image_writes | ||
| 6144 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6145 | void __ovld write_imagef(read_write image3d_t image, int4 coord, float4 color); | ||
| 6146 | void __ovld write_imagei(read_write image3d_t image, int4 coord, int4 color); | ||
| 6147 | void __ovld write_imageui(read_write image3d_t image, int4 coord, uint4 color); | ||
| 6148 | @@ -14777,7 +16808,7 @@ void __ovld write_imageui(read_write image2d_array_t image_array, int4 coord, in | ||
| 6149 | void __ovld write_imagef(read_write image2d_depth_t image, int2 coord, int lod, float color); | ||
| 6150 | void __ovld write_imagef(read_write image2d_array_depth_t image, int4 coord, int lod, float color); | ||
| 6151 | |||
| 6152 | -#ifdef cl_khr_3d_image_writes | ||
| 6153 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6154 | void __ovld write_imagef(read_write image3d_t image, int4 coord, int lod, float4 color); | ||
| 6155 | void __ovld write_imagei(read_write image3d_t image, int4 coord, int lod, int4 color); | ||
| 6156 | void __ovld write_imageui(read_write image3d_t image, int4 coord, int lod, uint4 color); | ||
| 6157 | @@ -14790,13 +16821,14 @@ void __ovld write_imageui(read_write image3d_t image, int4 coord, int lod, uint4 | ||
| 6158 | #ifdef cl_khr_fp16 | ||
| 6159 | void __ovld write_imageh(read_write image1d_t image, int coord, half4 color); | ||
| 6160 | void __ovld write_imageh(read_write image2d_t image, int2 coord, half4 color); | ||
| 6161 | -#ifdef cl_khr_3d_image_writes | ||
| 6162 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6163 | void __ovld write_imageh(read_write image3d_t image, int4 coord, half4 color); | ||
| 6164 | #endif | ||
| 6165 | void __ovld write_imageh(read_write image1d_array_t image, int2 coord, half4 color); | ||
| 6166 | void __ovld write_imageh(read_write image2d_array_t image, int4 coord, half4 color); | ||
| 6167 | void __ovld write_imageh(read_write image1d_buffer_t image, int coord, half4 color); | ||
| 6168 | #endif //cl_khr_fp16 | ||
| 6169 | +#endif //__opencl_c_read_write_images | ||
| 6170 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6171 | |||
| 6172 | // Note: In OpenCL v1.0/1.1/1.2, image argument of image query builtin functions does not have | ||
| 6173 | @@ -14810,7 +16842,7 @@ void __ovld write_imageh(read_write image1d_buffer_t image, int coord, half4 col | ||
| 6174 | int __ovld __cnfn get_image_width(read_only image1d_t image); | ||
| 6175 | int __ovld __cnfn get_image_width(read_only image1d_buffer_t image); | ||
| 6176 | int __ovld __cnfn get_image_width(read_only image2d_t image); | ||
| 6177 | -#ifdef cl_khr_3d_image_writes | ||
| 6178 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6179 | int __ovld __cnfn get_image_width(read_only image3d_t image); | ||
| 6180 | #endif | ||
| 6181 | int __ovld __cnfn get_image_width(read_only image1d_array_t image); | ||
| 6182 | @@ -14829,7 +16861,7 @@ int __ovld __cnfn get_image_width(read_only image2d_array_msaa_depth_t image); | ||
| 6183 | int __ovld __cnfn get_image_width(write_only image1d_t image); | ||
| 6184 | int __ovld __cnfn get_image_width(write_only image1d_buffer_t image); | ||
| 6185 | int __ovld __cnfn get_image_width(write_only image2d_t image); | ||
| 6186 | -#ifdef cl_khr_3d_image_writes | ||
| 6187 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6188 | int __ovld __cnfn get_image_width(write_only image3d_t image); | ||
| 6189 | #endif | ||
| 6190 | int __ovld __cnfn get_image_width(write_only image1d_array_t image); | ||
| 6191 | @@ -14846,6 +16878,7 @@ int __ovld __cnfn get_image_width(write_only image2d_array_msaa_depth_t image); | ||
| 6192 | #endif //cl_khr_gl_msaa_sharing | ||
| 6193 | |||
| 6194 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6195 | +#ifdef __opencl_c_read_write_images | ||
| 6196 | int __ovld __cnfn get_image_width(read_write image1d_t image); | ||
| 6197 | int __ovld __cnfn get_image_width(read_write image1d_buffer_t image); | ||
| 6198 | int __ovld __cnfn get_image_width(read_write image2d_t image); | ||
| 6199 | @@ -14862,6 +16895,7 @@ int __ovld __cnfn get_image_width(read_write image2d_msaa_depth_t image); | ||
| 6200 | int __ovld __cnfn get_image_width(read_write image2d_array_msaa_t image); | ||
| 6201 | int __ovld __cnfn get_image_width(read_write image2d_array_msaa_depth_t image); | ||
| 6202 | #endif //cl_khr_gl_msaa_sharing | ||
| 6203 | +#endif //__opencl_c_read_write_images | ||
| 6204 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6205 | |||
| 6206 | /** | ||
| 6207 | @@ -14882,7 +16916,7 @@ int __ovld __cnfn get_image_height(read_only image2d_array_msaa_depth_t image); | ||
| 6208 | #endif //cl_khr_gl_msaa_sharing | ||
| 6209 | |||
| 6210 | int __ovld __cnfn get_image_height(write_only image2d_t image); | ||
| 6211 | -#ifdef cl_khr_3d_image_writes | ||
| 6212 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6213 | int __ovld __cnfn get_image_height(write_only image3d_t image); | ||
| 6214 | #endif | ||
| 6215 | int __ovld __cnfn get_image_height(write_only image2d_array_t image); | ||
| 6216 | @@ -14898,6 +16932,7 @@ int __ovld __cnfn get_image_height(write_only image2d_array_msaa_depth_t image); | ||
| 6217 | #endif //cl_khr_gl_msaa_sharing | ||
| 6218 | |||
| 6219 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6220 | +#ifdef __opencl_c_read_write_images | ||
| 6221 | int __ovld __cnfn get_image_height(read_write image2d_t image); | ||
| 6222 | int __ovld __cnfn get_image_height(read_write image3d_t image); | ||
| 6223 | int __ovld __cnfn get_image_height(read_write image2d_array_t image); | ||
| 6224 | @@ -14911,6 +16946,7 @@ int __ovld __cnfn get_image_height(read_write image2d_msaa_depth_t image); | ||
| 6225 | int __ovld __cnfn get_image_height(read_write image2d_array_msaa_t image); | ||
| 6226 | int __ovld __cnfn get_image_height(read_write image2d_array_msaa_depth_t image); | ||
| 6227 | #endif //cl_khr_gl_msaa_sharing | ||
| 6228 | +#endif //__opencl_c_read_write_images | ||
| 6229 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6230 | |||
| 6231 | /** | ||
| 6232 | @@ -14918,12 +16954,14 @@ int __ovld __cnfn get_image_height(read_write image2d_array_msaa_depth_t image); | ||
| 6233 | */ | ||
| 6234 | int __ovld __cnfn get_image_depth(read_only image3d_t image); | ||
| 6235 | |||
| 6236 | -#ifdef cl_khr_3d_image_writes | ||
| 6237 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6238 | int __ovld __cnfn get_image_depth(write_only image3d_t image); | ||
| 6239 | #endif | ||
| 6240 | |||
| 6241 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6242 | +#ifdef __opencl_c_read_write_images | ||
| 6243 | int __ovld __cnfn get_image_depth(read_write image3d_t image); | ||
| 6244 | +#endif //__opencl_c_read_write_images | ||
| 6245 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6246 | |||
| 6247 | // OpenCL Extension v2.0 s9.18 - Mipmaps | ||
| 6248 | @@ -14939,13 +16977,15 @@ int __ovld get_image_num_mip_levels(read_only image3d_t image); | ||
| 6249 | |||
| 6250 | int __ovld get_image_num_mip_levels(write_only image1d_t image); | ||
| 6251 | int __ovld get_image_num_mip_levels(write_only image2d_t image); | ||
| 6252 | -#ifdef cl_khr_3d_image_writes | ||
| 6253 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6254 | int __ovld get_image_num_mip_levels(write_only image3d_t image); | ||
| 6255 | #endif | ||
| 6256 | |||
| 6257 | +#ifdef __opencl_c_read_write_images | ||
| 6258 | int __ovld get_image_num_mip_levels(read_write image1d_t image); | ||
| 6259 | int __ovld get_image_num_mip_levels(read_write image2d_t image); | ||
| 6260 | int __ovld get_image_num_mip_levels(read_write image3d_t image); | ||
| 6261 | +#endif //__opencl_c_read_write_images | ||
| 6262 | |||
| 6263 | int __ovld get_image_num_mip_levels(read_only image1d_array_t image); | ||
| 6264 | int __ovld get_image_num_mip_levels(read_only image2d_array_t image); | ||
| 6265 | @@ -14957,10 +16997,12 @@ int __ovld get_image_num_mip_levels(write_only image2d_array_t image); | ||
| 6266 | int __ovld get_image_num_mip_levels(write_only image2d_array_depth_t image); | ||
| 6267 | int __ovld get_image_num_mip_levels(write_only image2d_depth_t image); | ||
| 6268 | |||
| 6269 | +#ifdef __opencl_c_read_write_images | ||
| 6270 | int __ovld get_image_num_mip_levels(read_write image1d_array_t image); | ||
| 6271 | int __ovld get_image_num_mip_levels(read_write image2d_array_t image); | ||
| 6272 | int __ovld get_image_num_mip_levels(read_write image2d_array_depth_t image); | ||
| 6273 | int __ovld get_image_num_mip_levels(read_write image2d_depth_t image); | ||
| 6274 | +#endif //__opencl_c_read_write_images | ||
| 6275 | |||
| 6276 | #endif //cl_khr_mipmap_image | ||
| 6277 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6278 | @@ -15004,7 +17046,7 @@ int __ovld __cnfn get_image_channel_data_type(read_only image2d_array_msaa_depth | ||
| 6279 | int __ovld __cnfn get_image_channel_data_type(write_only image1d_t image); | ||
| 6280 | int __ovld __cnfn get_image_channel_data_type(write_only image1d_buffer_t image); | ||
| 6281 | int __ovld __cnfn get_image_channel_data_type(write_only image2d_t image); | ||
| 6282 | -#ifdef cl_khr_3d_image_writes | ||
| 6283 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6284 | int __ovld __cnfn get_image_channel_data_type(write_only image3d_t image); | ||
| 6285 | #endif | ||
| 6286 | int __ovld __cnfn get_image_channel_data_type(write_only image1d_array_t image); | ||
| 6287 | @@ -15021,6 +17063,7 @@ int __ovld __cnfn get_image_channel_data_type(write_only image2d_array_msaa_dept | ||
| 6288 | #endif //cl_khr_gl_msaa_sharing | ||
| 6289 | |||
| 6290 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6291 | +#ifdef __opencl_c_read_write_images | ||
| 6292 | int __ovld __cnfn get_image_channel_data_type(read_write image1d_t image); | ||
| 6293 | int __ovld __cnfn get_image_channel_data_type(read_write image1d_buffer_t image); | ||
| 6294 | int __ovld __cnfn get_image_channel_data_type(read_write image2d_t image); | ||
| 6295 | @@ -15037,6 +17080,7 @@ int __ovld __cnfn get_image_channel_data_type(read_write image2d_msaa_depth_t im | ||
| 6296 | int __ovld __cnfn get_image_channel_data_type(read_write image2d_array_msaa_t image); | ||
| 6297 | int __ovld __cnfn get_image_channel_data_type(read_write image2d_array_msaa_depth_t image); | ||
| 6298 | #endif //cl_khr_gl_msaa_sharing | ||
| 6299 | +#endif //__opencl_c_read_write_images | ||
| 6300 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6301 | |||
| 6302 | /** | ||
| 6303 | @@ -15076,7 +17120,7 @@ int __ovld __cnfn get_image_channel_order(read_only image2d_array_msaa_depth_t i | ||
| 6304 | int __ovld __cnfn get_image_channel_order(write_only image1d_t image); | ||
| 6305 | int __ovld __cnfn get_image_channel_order(write_only image1d_buffer_t image); | ||
| 6306 | int __ovld __cnfn get_image_channel_order(write_only image2d_t image); | ||
| 6307 | -#ifdef cl_khr_3d_image_writes | ||
| 6308 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6309 | int __ovld __cnfn get_image_channel_order(write_only image3d_t image); | ||
| 6310 | #endif | ||
| 6311 | int __ovld __cnfn get_image_channel_order(write_only image1d_array_t image); | ||
| 6312 | @@ -15093,6 +17137,7 @@ int __ovld __cnfn get_image_channel_order(write_only image2d_array_msaa_depth_t | ||
| 6313 | #endif //cl_khr_gl_msaa_sharing | ||
| 6314 | |||
| 6315 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6316 | +#ifdef __opencl_c_read_write_images | ||
| 6317 | int __ovld __cnfn get_image_channel_order(read_write image1d_t image); | ||
| 6318 | int __ovld __cnfn get_image_channel_order(read_write image1d_buffer_t image); | ||
| 6319 | int __ovld __cnfn get_image_channel_order(read_write image2d_t image); | ||
| 6320 | @@ -15109,6 +17154,7 @@ int __ovld __cnfn get_image_channel_order(read_write image2d_msaa_depth_t image) | ||
| 6321 | int __ovld __cnfn get_image_channel_order(read_write image2d_array_msaa_t image); | ||
| 6322 | int __ovld __cnfn get_image_channel_order(read_write image2d_array_msaa_depth_t image); | ||
| 6323 | #endif //cl_khr_gl_msaa_sharing | ||
| 6324 | +#endif //__opencl_c_read_write_images | ||
| 6325 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6326 | |||
| 6327 | /** | ||
| 6328 | @@ -15143,6 +17189,7 @@ int2 __ovld __cnfn get_image_dim(write_only image2d_array_msaa_depth_t image); | ||
| 6329 | #endif //cl_khr_gl_msaa_sharing | ||
| 6330 | |||
| 6331 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6332 | +#ifdef __opencl_c_read_write_images | ||
| 6333 | int2 __ovld __cnfn get_image_dim(read_write image2d_t image); | ||
| 6334 | int2 __ovld __cnfn get_image_dim(read_write image2d_array_t image); | ||
| 6335 | #ifdef cl_khr_depth_images | ||
| 6336 | @@ -15155,6 +17202,7 @@ int2 __ovld __cnfn get_image_dim(read_write image2d_msaa_depth_t image); | ||
| 6337 | int2 __ovld __cnfn get_image_dim(read_write image2d_array_msaa_t image); | ||
| 6338 | int2 __ovld __cnfn get_image_dim(read_write image2d_array_msaa_depth_t image); | ||
| 6339 | #endif //cl_khr_gl_msaa_sharing | ||
| 6340 | +#endif //__opencl_c_read_write_images | ||
| 6341 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6342 | |||
| 6343 | /** | ||
| 6344 | @@ -15164,11 +17212,13 @@ int2 __ovld __cnfn get_image_dim(read_write image2d_array_msaa_depth_t image); | ||
| 6345 | * component and the w component is 0. | ||
| 6346 | */ | ||
| 6347 | int4 __ovld __cnfn get_image_dim(read_only image3d_t image); | ||
| 6348 | -#ifdef cl_khr_3d_image_writes | ||
| 6349 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6350 | int4 __ovld __cnfn get_image_dim(write_only image3d_t image); | ||
| 6351 | #endif | ||
| 6352 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6353 | +#ifdef __opencl_c_read_write_images | ||
| 6354 | int4 __ovld __cnfn get_image_dim(read_write image3d_t image); | ||
| 6355 | +#endif //__opencl_c_read_write_images | ||
| 6356 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6357 | |||
| 6358 | /** | ||
| 6359 | @@ -15196,6 +17246,7 @@ size_t __ovld __cnfn get_image_array_size(write_only image2d_array_msaa_depth_t | ||
| 6360 | #endif //cl_khr_gl_msaa_sharing | ||
| 6361 | |||
| 6362 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6363 | +#ifdef __opencl_c_read_write_images | ||
| 6364 | size_t __ovld __cnfn get_image_array_size(read_write image1d_array_t image_array); | ||
| 6365 | size_t __ovld __cnfn get_image_array_size(read_write image2d_array_t image_array); | ||
| 6366 | #ifdef cl_khr_depth_images | ||
| 6367 | @@ -15205,6 +17256,7 @@ size_t __ovld __cnfn get_image_array_size(read_write image2d_array_depth_t image | ||
| 6368 | size_t __ovld __cnfn get_image_array_size(read_write image2d_array_msaa_t image_array); | ||
| 6369 | size_t __ovld __cnfn get_image_array_size(read_write image2d_array_msaa_depth_t image_array); | ||
| 6370 | #endif //cl_khr_gl_msaa_sharing | ||
| 6371 | +#endif //__opencl_c_read_write_images | ||
| 6372 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6373 | |||
| 6374 | /** | ||
| 6375 | @@ -15222,16 +17274,21 @@ int __ovld get_image_num_samples(write_only image2d_array_msaa_t image); | ||
| 6376 | int __ovld get_image_num_samples(write_only image2d_array_msaa_depth_t image); | ||
| 6377 | |||
| 6378 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6379 | +#ifdef __opencl_c_read_write_images | ||
| 6380 | int __ovld get_image_num_samples(read_write image2d_msaa_t image); | ||
| 6381 | int __ovld get_image_num_samples(read_write image2d_msaa_depth_t image); | ||
| 6382 | int __ovld get_image_num_samples(read_write image2d_array_msaa_t image); | ||
| 6383 | int __ovld get_image_num_samples(read_write image2d_array_msaa_depth_t image); | ||
| 6384 | +#endif //__opencl_c_read_write_images | ||
| 6385 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6386 | #endif | ||
| 6387 | |||
| 6388 | +#endif //__opencl_c_images | ||
| 6389 | + | ||
| 6390 | // OpenCL v2.0 s6.13.15 - Work-group Functions | ||
| 6391 | |||
| 6392 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6393 | +#ifdef __opencl_c_work_group_collective_functions | ||
| 6394 | int __ovld __conv work_group_all(int predicate); | ||
| 6395 | int __ovld __conv work_group_any(int predicate); | ||
| 6396 | |||
| 6397 | @@ -15255,11 +17312,11 @@ ulong __ovld __conv work_group_broadcast(ulong a, size_t x, size_t y, size_t z); | ||
| 6398 | float __ovld __conv work_group_broadcast(float a, size_t local_id); | ||
| 6399 | float __ovld __conv work_group_broadcast(float a, size_t x, size_t y); | ||
| 6400 | float __ovld __conv work_group_broadcast(float a, size_t x, size_t y, size_t z); | ||
| 6401 | -#ifdef cl_khr_fp64 | ||
| 6402 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6403 | double __ovld __conv work_group_broadcast(double a, size_t local_id); | ||
| 6404 | double __ovld __conv work_group_broadcast(double a, size_t x, size_t y); | ||
| 6405 | double __ovld __conv work_group_broadcast(double a, size_t x, size_t y, size_t z); | ||
| 6406 | -#endif //cl_khr_fp64 | ||
| 6407 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6408 | |||
| 6409 | #ifdef cl_khr_fp16 | ||
| 6410 | half __ovld __conv work_group_reduce_add(half x); | ||
| 6411 | @@ -15317,7 +17374,7 @@ float __ovld __conv work_group_scan_exclusive_max(float x); | ||
| 6412 | float __ovld __conv work_group_scan_inclusive_add(float x); | ||
| 6413 | float __ovld __conv work_group_scan_inclusive_min(float x); | ||
| 6414 | float __ovld __conv work_group_scan_inclusive_max(float x); | ||
| 6415 | -#ifdef cl_khr_fp64 | ||
| 6416 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6417 | double __ovld __conv work_group_reduce_add(double x); | ||
| 6418 | double __ovld __conv work_group_reduce_min(double x); | ||
| 6419 | double __ovld __conv work_group_reduce_max(double x); | ||
| 6420 | @@ -15327,19 +17384,18 @@ double __ovld __conv work_group_scan_exclusive_max(double x); | ||
| 6421 | double __ovld __conv work_group_scan_inclusive_add(double x); | ||
| 6422 | double __ovld __conv work_group_scan_inclusive_min(double x); | ||
| 6423 | double __ovld __conv work_group_scan_inclusive_max(double x); | ||
| 6424 | -#endif //cl_khr_fp64 | ||
| 6425 | - | ||
| 6426 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6427 | +#endif //__opencl_c_work_group_collective_functions | ||
| 6428 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6429 | |||
| 6430 | // OpenCL v2.0 s6.13.16 - Pipe Functions | ||
| 6431 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6432 | +#ifdef __opencl_c_pipes | ||
| 6433 | bool __ovld is_valid_reserve_id(reserve_id_t reserve_id); | ||
| 6434 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6435 | - | ||
| 6436 | +#endif //__opencl_c_pipes | ||
| 6437 | |||
| 6438 | // OpenCL v2.0 s6.13.17 - Enqueue Kernels | ||
| 6439 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6440 | - | ||
| 6441 | +#ifdef __opencl_c_device_enqueue | ||
| 6442 | ndrange_t __ovld ndrange_1D(size_t); | ||
| 6443 | ndrange_t __ovld ndrange_1D(size_t, size_t); | ||
| 6444 | ndrange_t __ovld ndrange_1D(size_t, size_t, size_t); | ||
| 6445 | @@ -15367,11 +17423,13 @@ bool __ovld is_valid_event (clk_event_t event); | ||
| 6446 | void __ovld capture_event_profiling_info(clk_event_t, clk_profiling_info, __global void* value); | ||
| 6447 | |||
| 6448 | queue_t __ovld get_default_queue(void); | ||
| 6449 | +#endif //__opencl_c_device_enqueue | ||
| 6450 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6451 | |||
| 6452 | // OpenCL Extension v2.0 s9.17 - Sub-groups | ||
| 6453 | |||
| 6454 | -#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups) | ||
| 6455 | +#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups) || \ | ||
| 6456 | + defined(__opencl_c_subgroups) | ||
| 6457 | // Shared Sub Group Functions | ||
| 6458 | uint __ovld get_sub_group_size(void); | ||
| 6459 | uint __ovld get_max_sub_group_size(void); | ||
| 6460 | @@ -15457,7 +17515,7 @@ half __ovld __conv sub_group_scan_inclusive_min(half x); | ||
| 6461 | half __ovld __conv sub_group_scan_inclusive_max(half x); | ||
| 6462 | #endif //cl_khr_fp16 | ||
| 6463 | |||
| 6464 | -#ifdef cl_khr_fp64 | ||
| 6465 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6466 | double __ovld __conv sub_group_broadcast(double x, uint sub_group_local_id); | ||
| 6467 | double __ovld __conv sub_group_reduce_add(double x); | ||
| 6468 | double __ovld __conv sub_group_reduce_min(double x); | ||
| 6469 | @@ -15468,7 +17526,7 @@ double __ovld __conv sub_group_scan_exclusive_max(double x); | ||
| 6470 | double __ovld __conv sub_group_scan_inclusive_add(double x); | ||
| 6471 | double __ovld __conv sub_group_scan_inclusive_min(double x); | ||
| 6472 | double __ovld __conv sub_group_scan_inclusive_max(double x); | ||
| 6473 | -#endif //cl_khr_fp64 | ||
| 6474 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6475 | |||
| 6476 | #endif //cl_khr_subgroups cl_intel_subgroups | ||
| 6477 | |||
| 6478 | @@ -15570,16 +17628,22 @@ uint16 __ovld __conv intel_sub_group_shuffle_xor( uint16 x, uint c ); | ||
| 6479 | long __ovld __conv intel_sub_group_shuffle_xor( long x, uint c ); | ||
| 6480 | ulong __ovld __conv intel_sub_group_shuffle_xor( ulong x, uint c ); | ||
| 6481 | |||
| 6482 | +#ifdef __opencl_c_images | ||
| 6483 | uint __ovld __conv intel_sub_group_block_read( read_only image2d_t image, int2 coord ); | ||
| 6484 | uint2 __ovld __conv intel_sub_group_block_read2( read_only image2d_t image, int2 coord ); | ||
| 6485 | uint4 __ovld __conv intel_sub_group_block_read4( read_only image2d_t image, int2 coord ); | ||
| 6486 | uint8 __ovld __conv intel_sub_group_block_read8( read_only image2d_t image, int2 coord ); | ||
| 6487 | +#endif //__opencl_c_images | ||
| 6488 | |||
| 6489 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6490 | +#ifdef __opencl_c_images | ||
| 6491 | +#ifdef __opencl_c_read_write_images | ||
| 6492 | uint __ovld __conv intel_sub_group_block_read(read_write image2d_t image, int2 coord); | ||
| 6493 | uint2 __ovld __conv intel_sub_group_block_read2(read_write image2d_t image, int2 coord); | ||
| 6494 | uint4 __ovld __conv intel_sub_group_block_read4(read_write image2d_t image, int2 coord); | ||
| 6495 | uint8 __ovld __conv intel_sub_group_block_read8(read_write image2d_t image, int2 coord); | ||
| 6496 | +#endif //__opencl_c_read_write_images | ||
| 6497 | +#endif //__opencl_c_images | ||
| 6498 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6499 | |||
| 6500 | uint __ovld __conv intel_sub_group_block_read( const __global uint* p ); | ||
| 6501 | @@ -15587,16 +17651,22 @@ uint2 __ovld __conv intel_sub_group_block_read2( const __global uint* p ); | ||
| 6502 | uint4 __ovld __conv intel_sub_group_block_read4( const __global uint* p ); | ||
| 6503 | uint8 __ovld __conv intel_sub_group_block_read8( const __global uint* p ); | ||
| 6504 | |||
| 6505 | +#ifdef __opencl_c_images | ||
| 6506 | void __ovld __conv intel_sub_group_block_write(write_only image2d_t image, int2 coord, uint data); | ||
| 6507 | void __ovld __conv intel_sub_group_block_write2(write_only image2d_t image, int2 coord, uint2 data); | ||
| 6508 | void __ovld __conv intel_sub_group_block_write4(write_only image2d_t image, int2 coord, uint4 data); | ||
| 6509 | void __ovld __conv intel_sub_group_block_write8(write_only image2d_t image, int2 coord, uint8 data); | ||
| 6510 | +#endif //__opencl_c_images | ||
| 6511 | |||
| 6512 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6513 | +#ifdef __opencl_c_images | ||
| 6514 | +#ifdef __opencl_c_read_write_images | ||
| 6515 | void __ovld __conv intel_sub_group_block_write(read_write image2d_t image, int2 coord, uint data); | ||
| 6516 | void __ovld __conv intel_sub_group_block_write2(read_write image2d_t image, int2 coord, uint2 data); | ||
| 6517 | void __ovld __conv intel_sub_group_block_write4(read_write image2d_t image, int2 coord, uint4 data); | ||
| 6518 | void __ovld __conv intel_sub_group_block_write8(read_write image2d_t image, int2 coord, uint8 data); | ||
| 6519 | +#endif // __opencl_c_read_write_images | ||
| 6520 | +#endif // __opencl_c_images | ||
| 6521 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6522 | |||
| 6523 | void __ovld __conv intel_sub_group_block_write( __global uint* p, uint data ); | ||
| 6524 | @@ -15611,7 +17681,7 @@ half __ovld __conv intel_sub_group_shuffle_up( half prev, half cur, uint c ); | ||
| 6525 | half __ovld __conv intel_sub_group_shuffle_xor( half x, uint c ); | ||
| 6526 | #endif | ||
| 6527 | |||
| 6528 | -#if defined(cl_khr_fp64) | ||
| 6529 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6530 | double __ovld __conv intel_sub_group_shuffle( double x, uint c ); | ||
| 6531 | double __ovld __conv intel_sub_group_shuffle_down( double prev, double cur, uint c ); | ||
| 6532 | double __ovld __conv intel_sub_group_shuffle_up( double prev, double cur, uint c ); | ||
| 6533 | @@ -15710,16 +17780,22 @@ ushort __ovld __conv intel_sub_group_scan_inclusive_min( ushort x ); | ||
| 6534 | short __ovld __conv intel_sub_group_scan_inclusive_max( short x ); | ||
| 6535 | ushort __ovld __conv intel_sub_group_scan_inclusive_max( ushort x ); | ||
| 6536 | |||
| 6537 | +#ifdef __opencl_c_images | ||
| 6538 | uint __ovld __conv intel_sub_group_block_read_ui( read_only image2d_t image, int2 byte_coord ); | ||
| 6539 | uint2 __ovld __conv intel_sub_group_block_read_ui2( read_only image2d_t image, int2 byte_coord ); | ||
| 6540 | uint4 __ovld __conv intel_sub_group_block_read_ui4( read_only image2d_t image, int2 byte_coord ); | ||
| 6541 | uint8 __ovld __conv intel_sub_group_block_read_ui8( read_only image2d_t image, int2 byte_coord ); | ||
| 6542 | +#endif //__opencl_c_images | ||
| 6543 | |||
| 6544 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6545 | +#ifdef __opencl_c_images | ||
| 6546 | +#ifdef __opencl_c_read_write_images | ||
| 6547 | uint __ovld __conv intel_sub_group_block_read_ui( read_write image2d_t image, int2 byte_coord ); | ||
| 6548 | uint2 __ovld __conv intel_sub_group_block_read_ui2( read_write image2d_t image, int2 byte_coord ); | ||
| 6549 | uint4 __ovld __conv intel_sub_group_block_read_ui4( read_write image2d_t image, int2 byte_coord ); | ||
| 6550 | uint8 __ovld __conv intel_sub_group_block_read_ui8( read_write image2d_t image, int2 byte_coord ); | ||
| 6551 | +#endif //__opencl_c_read_write_images | ||
| 6552 | +#endif //__opencl_c_images | ||
| 6553 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6554 | |||
| 6555 | uint __ovld __conv intel_sub_group_block_read_ui( const __global uint* p ); | ||
| 6556 | @@ -15727,16 +17803,22 @@ uint2 __ovld __conv intel_sub_group_block_read_ui2( const __global uint* p | ||
| 6557 | uint4 __ovld __conv intel_sub_group_block_read_ui4( const __global uint* p ); | ||
| 6558 | uint8 __ovld __conv intel_sub_group_block_read_ui8( const __global uint* p ); | ||
| 6559 | |||
| 6560 | +#ifdef __opencl_c_images | ||
| 6561 | void __ovld __conv intel_sub_group_block_write_ui( read_only image2d_t image, int2 byte_coord, uint data ); | ||
| 6562 | void __ovld __conv intel_sub_group_block_write_ui2( read_only image2d_t image, int2 byte_coord, uint2 data ); | ||
| 6563 | void __ovld __conv intel_sub_group_block_write_ui4( read_only image2d_t image, int2 byte_coord, uint4 data ); | ||
| 6564 | void __ovld __conv intel_sub_group_block_write_ui8( read_only image2d_t image, int2 byte_coord, uint8 data ); | ||
| 6565 | +#endif //__opencl_c_images | ||
| 6566 | |||
| 6567 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6568 | +#ifdef __opencl_c_images | ||
| 6569 | +#ifdef __opencl_c_read_write_images | ||
| 6570 | void __ovld __conv intel_sub_group_block_write_ui( read_write image2d_t image, int2 byte_coord, uint data ); | ||
| 6571 | void __ovld __conv intel_sub_group_block_write_ui2( read_write image2d_t image, int2 byte_coord, uint2 data ); | ||
| 6572 | void __ovld __conv intel_sub_group_block_write_ui4( read_write image2d_t image, int2 byte_coord, uint4 data ); | ||
| 6573 | void __ovld __conv intel_sub_group_block_write_ui8( read_write image2d_t image, int2 byte_coord, uint8 data ); | ||
| 6574 | +#endif //__opencl_c_read_write_images | ||
| 6575 | +#endif //__opencl_c_images | ||
| 6576 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6577 | |||
| 6578 | void __ovld __conv intel_sub_group_block_write_ui( __global uint* p, uint data ); | ||
| 6579 | @@ -15744,16 +17826,22 @@ void __ovld __conv intel_sub_group_block_write_ui2( __global uint* p, uint | ||
| 6580 | void __ovld __conv intel_sub_group_block_write_ui4( __global uint* p, uint4 data ); | ||
| 6581 | void __ovld __conv intel_sub_group_block_write_ui8( __global uint* p, uint8 data ); | ||
| 6582 | |||
| 6583 | +#ifdef __opencl_c_images | ||
| 6584 | ushort __ovld __conv intel_sub_group_block_read_us( read_only image2d_t image, int2 coord ); | ||
| 6585 | ushort2 __ovld __conv intel_sub_group_block_read_us2( read_only image2d_t image, int2 coord ); | ||
| 6586 | ushort4 __ovld __conv intel_sub_group_block_read_us4( read_only image2d_t image, int2 coord ); | ||
| 6587 | ushort8 __ovld __conv intel_sub_group_block_read_us8( read_only image2d_t image, int2 coord ); | ||
| 6588 | +#endif //__opencl_c_images | ||
| 6589 | |||
| 6590 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6591 | +#ifdef __opencl_c_images | ||
| 6592 | +#ifdef __opencl_c_read_write_images | ||
| 6593 | ushort __ovld __conv intel_sub_group_block_read_us(read_write image2d_t image, int2 coord); | ||
| 6594 | ushort2 __ovld __conv intel_sub_group_block_read_us2(read_write image2d_t image, int2 coord); | ||
| 6595 | ushort4 __ovld __conv intel_sub_group_block_read_us4(read_write image2d_t image, int2 coord); | ||
| 6596 | ushort8 __ovld __conv intel_sub_group_block_read_us8(read_write image2d_t image, int2 coord); | ||
| 6597 | +#endif //__opencl_c_read_write_images | ||
| 6598 | +#endif //__opencl_c_images | ||
| 6599 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6600 | |||
| 6601 | ushort __ovld __conv intel_sub_group_block_read_us( const __global ushort* p ); | ||
| 6602 | @@ -15761,16 +17849,22 @@ ushort2 __ovld __conv intel_sub_group_block_read_us2( const __global ushort* | ||
| 6603 | ushort4 __ovld __conv intel_sub_group_block_read_us4( const __global ushort* p ); | ||
| 6604 | ushort8 __ovld __conv intel_sub_group_block_read_us8( const __global ushort* p ); | ||
| 6605 | |||
| 6606 | +#ifdef __opencl_c_images | ||
| 6607 | void __ovld __conv intel_sub_group_block_write_us(write_only image2d_t image, int2 coord, ushort data); | ||
| 6608 | void __ovld __conv intel_sub_group_block_write_us2(write_only image2d_t image, int2 coord, ushort2 data); | ||
| 6609 | void __ovld __conv intel_sub_group_block_write_us4(write_only image2d_t image, int2 coord, ushort4 data); | ||
| 6610 | void __ovld __conv intel_sub_group_block_write_us8(write_only image2d_t image, int2 coord, ushort8 data); | ||
| 6611 | +#endif //__opencl_c_images | ||
| 6612 | |||
| 6613 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6614 | +#ifdef __opencl_c_images | ||
| 6615 | +#ifdef __opencl_c_read_write_images | ||
| 6616 | void __ovld __conv intel_sub_group_block_write_us(read_write image2d_t image, int2 coord, ushort data); | ||
| 6617 | void __ovld __conv intel_sub_group_block_write_us2(read_write image2d_t image, int2 coord, ushort2 data); | ||
| 6618 | void __ovld __conv intel_sub_group_block_write_us4(read_write image2d_t image, int2 coord, ushort4 data); | ||
| 6619 | void __ovld __conv intel_sub_group_block_write_us8(read_write image2d_t image, int2 coord, ushort8 data); | ||
| 6620 | +#endif //__opencl_c_read_write_images | ||
| 6621 | +#endif //__opencl_c_images | ||
| 6622 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6623 | |||
| 6624 | void __ovld __conv intel_sub_group_block_write_us( __global ushort* p, ushort data ); | ||
| 6625 | @@ -15889,6 +17983,7 @@ short2 __ovld intel_sub_group_avc_ime_adjust_ref_offset( | ||
| 6626 | short2 ref_offset, ushort2 src_coord, ushort2 ref_window_size, | ||
| 6627 | ushort2 image_size); | ||
| 6628 | |||
| 6629 | +#ifdef __opencl_c_images | ||
| 6630 | intel_sub_group_avc_ime_result_t __ovld | ||
| 6631 | intel_sub_group_avc_ime_evaluate_with_single_reference( | ||
| 6632 | read_only image2d_t src_image, read_only image2d_t ref_image, | ||
| 6633 | @@ -15929,6 +18024,7 @@ intel_sub_group_avc_ime_evaluate_with_dual_reference_streaminout( | ||
| 6634 | read_only image2d_t bwd_ref_image, sampler_t vme_media_sampler, | ||
| 6635 | intel_sub_group_avc_ime_payload_t payload, | ||
| 6636 | intel_sub_group_avc_ime_dual_reference_streamin_t streamin_components); | ||
| 6637 | +#endif //__opencl_c_images | ||
| 6638 | |||
| 6639 | intel_sub_group_avc_ime_single_reference_streamin_t __ovld | ||
| 6640 | intel_sub_group_avc_ime_get_single_reference_streamin( | ||
| 6641 | @@ -15993,6 +18089,7 @@ intel_sub_group_avc_ref_payload_t __ovld | ||
| 6642 | intel_sub_group_avc_ref_set_bilinear_filter_enable( | ||
| 6643 | intel_sub_group_avc_ref_payload_t payload); | ||
| 6644 | |||
| 6645 | +#ifdef __opencl_c_images | ||
| 6646 | intel_sub_group_avc_ref_result_t __ovld | ||
| 6647 | intel_sub_group_avc_ref_evaluate_with_single_reference( | ||
| 6648 | read_only image2d_t src_image, read_only image2d_t ref_image, | ||
| 6649 | @@ -16011,6 +18108,7 @@ intel_sub_group_avc_ref_evaluate_with_multi_reference( | ||
| 6650 | read_only image2d_t src_image, uint packed_reference_ids, | ||
| 6651 | uchar packed_reference_field_polarities, sampler_t vme_media_sampler, | ||
| 6652 | intel_sub_group_avc_ref_payload_t payload); | ||
| 6653 | +#endif //__opencl_c_images | ||
| 6654 | |||
| 6655 | // SIC built-in functions | ||
| 6656 | intel_sub_group_avc_sic_payload_t __ovld | ||
| 6657 | @@ -16061,6 +18159,7 @@ intel_sub_group_avc_sic_set_block_based_raw_skip_sad( | ||
| 6658 | uchar block_based_skip_type, | ||
| 6659 | intel_sub_group_avc_sic_payload_t payload); | ||
| 6660 | |||
| 6661 | +#ifdef __opencl_c_images | ||
| 6662 | intel_sub_group_avc_sic_result_t __ovld | ||
| 6663 | intel_sub_group_avc_sic_evaluate_ipe( | ||
| 6664 | read_only image2d_t src_image, sampler_t vme_media_sampler, | ||
| 6665 | @@ -16083,6 +18182,7 @@ intel_sub_group_avc_sic_evaluate_with_multi_reference( | ||
| 6666 | read_only image2d_t src_image, uint packed_reference_ids, | ||
| 6667 | uchar packed_reference_field_polarities, sampler_t vme_media_sampler, | ||
| 6668 | intel_sub_group_avc_sic_payload_t payload); | ||
| 6669 | +#endif //__opencl_c_images | ||
| 6670 | |||
| 6671 | uchar __ovld intel_sub_group_avc_sic_get_ipe_luma_shape( | ||
| 6672 | intel_sub_group_avc_sic_result_t result); | ||
| 6673 | diff --git a/clang/lib/Parse/ParseDecl.cpp b/clang/lib/Parse/ParseDecl.cpp | ||
| 6674 | index 6353e14bc41a..a8c216de6e04 100644 | ||
| 6675 | --- a/clang/lib/Parse/ParseDecl.cpp | ||
| 6676 | +++ b/clang/lib/Parse/ParseDecl.cpp | ||
| 6677 | @@ -3904,8 +3904,7 @@ void Parser::ParseDeclarationSpecifiers(DeclSpec &DS, | ||
| 6678 | isInvalid = DS.SetTypeAltiVecBool(true, Loc, PrevSpec, DiagID, Policy); | ||
| 6679 | break; | ||
| 6680 | case tok::kw_pipe: | ||
| 6681 | - if (!getLangOpts().OpenCL || (getLangOpts().OpenCLVersion < 200 && | ||
| 6682 | - !getLangOpts().OpenCLCPlusPlus)) { | ||
| 6683 | + if (!getLangOpts().OpenCLPipeKeyword) { | ||
| 6684 | // OpenCL 2.0 defined this keyword. OpenCL 1.2 and earlier should | ||
| 6685 | // support the "pipe" word as identifier. | ||
| 6686 | Tok.getIdentifierInfo()->revertTokenIDToIdentifier(); | ||
| 6687 | @@ -4027,8 +4026,7 @@ void Parser::ParseDeclarationSpecifiers(DeclSpec &DS, | ||
| 6688 | case tok::kw___generic: | ||
| 6689 | // generic address space is introduced only in OpenCL v2.0 | ||
| 6690 | // see OpenCL C Spec v2.0 s6.5.5 | ||
| 6691 | - if (Actions.getLangOpts().OpenCLVersion < 200 && | ||
| 6692 | - !Actions.getLangOpts().OpenCLCPlusPlus) { | ||
| 6693 | + if (!Actions.getLangOpts().OpenCLGenericKeyword) { | ||
| 6694 | DiagID = diag::err_opencl_unknown_type_specifier; | ||
| 6695 | PrevSpec = Tok.getIdentifierInfo()->getNameStart(); | ||
| 6696 | isInvalid = true; | ||
| 6697 | @@ -5050,8 +5048,7 @@ bool Parser::isDeclarationSpecifier(bool DisambiguatingWithExpression) { | ||
| 6698 | default: return false; | ||
| 6699 | |||
| 6700 | case tok::kw_pipe: | ||
| 6701 | - return (getLangOpts().OpenCL && getLangOpts().OpenCLVersion >= 200) || | ||
| 6702 | - getLangOpts().OpenCLCPlusPlus; | ||
| 6703 | + return getLangOpts().OpenCLPipeKeyword; | ||
| 6704 | |||
| 6705 | case tok::identifier: // foo::bar | ||
| 6706 | // Unfortunate hack to support "Class.factoryMethod" notation. | ||
| 6707 | @@ -5557,8 +5554,7 @@ static bool isPtrOperatorToken(tok::TokenKind Kind, const LangOptions &Lang, | ||
| 6708 | if (Kind == tok::star || Kind == tok::caret) | ||
| 6709 | return true; | ||
| 6710 | |||
| 6711 | - if (Kind == tok::kw_pipe && | ||
| 6712 | - ((Lang.OpenCL && Lang.OpenCLVersion >= 200) || Lang.OpenCLCPlusPlus)) | ||
| 6713 | + if (Kind == tok::kw_pipe && Lang.OpenCLPipeKeyword) | ||
| 6714 | return true; | ||
| 6715 | |||
| 6716 | if (!Lang.CPlusPlus) | ||
| 6717 | diff --git a/clang/lib/Parse/ParsePragma.cpp b/clang/lib/Parse/ParsePragma.cpp | ||
| 6718 | index df411e1928d6..9a40ce888695 100644 | ||
| 6719 | --- a/clang/lib/Parse/ParsePragma.cpp | ||
| 6720 | +++ b/clang/lib/Parse/ParsePragma.cpp | ||
| 6721 | @@ -697,12 +697,14 @@ void Parser::HandlePragmaOpenCLExtension() { | ||
| 6722 | if (Name == "all") { | ||
| 6723 | if (State == Disable) { | ||
| 6724 | Opt.disableAll(); | ||
| 6725 | - Opt.enableSupportedCore(getLangOpts()); | ||
| 6726 | + Opt.enableSupportedCore(); | ||
| 6727 | } else { | ||
| 6728 | PP.Diag(NameLoc, diag::warn_pragma_expected_predicate) << 1; | ||
| 6729 | } | ||
| 6730 | + } else if (Opt.isFeature(Name)) { | ||
| 6731 | + PP.Diag(NameLoc, diag::warn_opencl_pragma_feature_ignore) << Ident; | ||
| 6732 | } else if (State == Begin) { | ||
| 6733 | - if (!Opt.isKnown(Name) || !Opt.isSupported(Name, getLangOpts())) { | ||
| 6734 | + if (!Opt.isKnown(Name) || !Opt.isSupported(Name)) { | ||
| 6735 | Opt.support(Name); | ||
| 6736 | } | ||
| 6737 | Actions.setCurrentOpenCLExtension(Name); | ||
| 6738 | @@ -712,9 +714,9 @@ void Parser::HandlePragmaOpenCLExtension() { | ||
| 6739 | Actions.setCurrentOpenCLExtension(""); | ||
| 6740 | } else if (!Opt.isKnown(Name)) | ||
| 6741 | PP.Diag(NameLoc, diag::warn_pragma_unknown_extension) << Ident; | ||
| 6742 | - else if (Opt.isSupportedExtension(Name, getLangOpts())) | ||
| 6743 | + else if (Opt.isSupportedExtension(Name)) | ||
| 6744 | Opt.enable(Name, State == Enable); | ||
| 6745 | - else if (Opt.isSupportedCore(Name, getLangOpts())) | ||
| 6746 | + else if (Opt.isSupportedCore(Name)) | ||
| 6747 | PP.Diag(NameLoc, diag::warn_pragma_extension_is_core) << Ident; | ||
| 6748 | else | ||
| 6749 | PP.Diag(NameLoc, diag::warn_pragma_unsupported_extension) << Ident; | ||
| 6750 | diff --git a/clang/lib/Sema/OpenCLBuiltins.td b/clang/lib/Sema/OpenCLBuiltins.td | ||
| 6751 | index 9d6bb411eff8..d352d35f1e46 100644 | ||
| 6752 | --- a/clang/lib/Sema/OpenCLBuiltins.td | ||
| 6753 | +++ b/clang/lib/Sema/OpenCLBuiltins.td | ||
| 6754 | @@ -22,11 +22,13 @@ | ||
| 6755 | class Version<int _Version> { | ||
| 6756 | int ID = _Version; | ||
| 6757 | } | ||
| 6758 | + | ||
| 6759 | def CLAll : Version< 0>; | ||
| 6760 | def CL10 : Version<100>; | ||
| 6761 | def CL11 : Version<110>; | ||
| 6762 | def CL12 : Version<120>; | ||
| 6763 | def CL20 : Version<200>; | ||
| 6764 | +def CL30 : Version<300>; | ||
| 6765 | |||
| 6766 | // Address spaces | ||
| 6767 | // Pointer types need to be assigned an address space. | ||
| 6768 | @@ -65,6 +67,14 @@ def FuncExtKhrGlMsaaSharing : FunctionExtension<"cl_khr_gl_msaa_sha | ||
| 6769 | // Multiple extensions | ||
| 6770 | def FuncExtKhrMipmapAndWrite3d : FunctionExtension<"cl_khr_mipmap_image cl_khr_3d_image_writes">; | ||
| 6771 | |||
| 6772 | +// Features | ||
| 6773 | +def FuncExtGenericAddressSpace : FunctionExtension<"__opencl_c_generic_address_space">; | ||
| 6774 | +def FuncExtWorkGroupCollective : FunctionExtension<"__opencl_c_work_group_collective_functions">; | ||
| 6775 | +def FuncExtPipes : FunctionExtension<"__opencl_c_pipes">; | ||
| 6776 | +def FuncExtDeviceSidEenqueue : FunctionExtension<"__opencl_c_device_enqueue">; | ||
| 6777 | +def FuncNonExplicitAtomicFeatures : FunctionExtension<"__opencl_c_atomic_order_seq_cst __opencl_c_atomic_scope_device">; | ||
| 6778 | +def FuncNonExplicitAtomicFeaturesAndGenericAS : FunctionExtension<"__opencl_c_atomic_order_seq_cst __opencl_c_atomic_scope_device __opencl_c_generic_address_space">; | ||
| 6779 | + | ||
| 6780 | // Qualified Type. These map to ASTContext::QualType. | ||
| 6781 | class QualType<string _Name, bit _IsAbstract=0> { | ||
| 6782 | // Name of the field or function in a clang::ASTContext | ||
| 6783 | @@ -230,13 +240,9 @@ class Builtin<string _Name, list<Type> _Signature, list<bit> _Attributes = Attr. | ||
| 6784 | bit IsConv = _Attributes[2]; | ||
| 6785 | // OpenCL extensions to which the function belongs. | ||
| 6786 | FunctionExtension Extension = FuncExtNone; | ||
| 6787 | - // Version of OpenCL from which the function is available (e.g.: CL10). | ||
| 6788 | - // MinVersion is inclusive. | ||
| 6789 | - Version MinVersion = CL10; | ||
| 6790 | - // Version of OpenCL from which the function is not supported anymore. | ||
| 6791 | - // MaxVersion is exclusive. | ||
| 6792 | + // List of OpenCL version in which this function available. | ||
| 6793 | // CLAll makes the function available for all versions. | ||
| 6794 | - Version MaxVersion = CLAll; | ||
| 6795 | + list<Version> Versions = [CLAll]; | ||
| 6796 | } | ||
| 6797 | |||
| 6798 | //===----------------------------------------------------------------------===// | ||
| 6799 | @@ -398,7 +404,7 @@ foreach name = ["get_global_size", "get_global_id", "get_local_size", | ||
| 6800 | def : Builtin<name, [Size, UInt], Attr.Const>; | ||
| 6801 | } | ||
| 6802 | |||
| 6803 | -let MinVersion = CL20 in { | ||
| 6804 | +let Versions = [CL20, CL30] in { | ||
| 6805 | def : Builtin<"get_enqueued_local_size", [Size, UInt]>; | ||
| 6806 | foreach name = ["get_global_linear_id", "get_local_linear_id"] in { | ||
| 6807 | def : Builtin<name, [Size]>; | ||
| 6808 | @@ -471,7 +477,7 @@ foreach name = ["fma", "mad"] in { | ||
| 6809 | } | ||
| 6810 | |||
| 6811 | // --- Version dependent --- | ||
| 6812 | -let MaxVersion = CL20 in { | ||
| 6813 | +let Versions = [CL10, CL11, CL12, CL30] in { | ||
| 6814 | foreach AS = [GlobalAS, LocalAS, PrivateAS] in { | ||
| 6815 | foreach name = ["fract", "modf", "sincos"] in { | ||
| 6816 | def : Builtin<name, [FGenTypeN, FGenTypeN, PointerType<FGenTypeN, AS>]>; | ||
| 6817 | @@ -488,7 +494,9 @@ let MaxVersion = CL20 in { | ||
| 6818 | } | ||
| 6819 | } | ||
| 6820 | } | ||
| 6821 | -let MinVersion = CL20 in { | ||
| 6822 | + | ||
| 6823 | +let Versions = [CL20, CL30] in { | ||
| 6824 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6825 | foreach name = ["fract", "modf", "sincos"] in { | ||
| 6826 | def : Builtin<name, [FGenTypeN, FGenTypeN, PointerType<FGenTypeN, GenericAS>]>; | ||
| 6827 | } | ||
| 6828 | @@ -501,6 +509,7 @@ let MinVersion = CL20 in { | ||
| 6829 | def : Builtin<name, [Type, Type, Type, PointerType<GenTypeIntVecAndScalar, GenericAS>]>; | ||
| 6830 | } | ||
| 6831 | } | ||
| 6832 | + } | ||
| 6833 | } | ||
| 6834 | |||
| 6835 | // --- Table 9 --- | ||
| 6836 | @@ -531,7 +540,7 @@ foreach name = ["abs"] in { | ||
| 6837 | foreach name = ["clz", "popcount"] in { | ||
| 6838 | def : Builtin<name, [AIGenTypeN, AIGenTypeN], Attr.Const>; | ||
| 6839 | } | ||
| 6840 | -let MinVersion = CL20 in { | ||
| 6841 | +let Versions = [CL20, CL30] in { | ||
| 6842 | foreach name = ["ctz"] in { | ||
| 6843 | def : Builtin<name, [AIGenTypeN, AIGenTypeN]>; | ||
| 6844 | } | ||
| 6845 | @@ -705,7 +714,7 @@ foreach name = ["select"] in { | ||
| 6846 | // --- Table 15 --- | ||
| 6847 | // Variants for OpenCL versions below 2.0, using pointers to the global, local | ||
| 6848 | // and private address spaces. | ||
| 6849 | -let MaxVersion = CL20 in { | ||
| 6850 | +let Versions = [CL10, CL11, CL12, CL30] in { | ||
| 6851 | foreach AS = [GlobalAS, LocalAS, PrivateAS] in { | ||
| 6852 | foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6853 | foreach name = ["vload" # VSize] in { | ||
| 6854 | @@ -748,7 +757,8 @@ let MaxVersion = CL20 in { | ||
| 6855 | } | ||
| 6856 | // Variants for OpenCL versions above 2.0, using pointers to the generic | ||
| 6857 | // address space. | ||
| 6858 | -let MinVersion = CL20 in { | ||
| 6859 | +let Versions = [CL20, CL30] in { | ||
| 6860 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6861 | foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6862 | foreach name = ["vload" # VSize] in { | ||
| 6863 | def : Builtin<name, [VectorType<Char, VSize>, Size, PointerType<ConstType<Char>, GenericAS>]>; | ||
| 6864 | @@ -786,6 +796,7 @@ let MinVersion = CL20 in { | ||
| 6865 | } | ||
| 6866 | } | ||
| 6867 | } | ||
| 6868 | + } | ||
| 6869 | } | ||
| 6870 | // Variants using pointers to the constant address space. | ||
| 6871 | foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6872 | @@ -812,7 +823,7 @@ foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6873 | } | ||
| 6874 | } | ||
| 6875 | } | ||
| 6876 | -let MaxVersion = CL20 in { | ||
| 6877 | +let Versions = [CL10, CL11, CL12, CL30] in { | ||
| 6878 | foreach AS = [GlobalAS, LocalAS, PrivateAS] in { | ||
| 6879 | def : Builtin<"vload_half", [Float, Size, PointerType<ConstType<Half>, AS>]>; | ||
| 6880 | foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6881 | @@ -832,7 +843,8 @@ let MaxVersion = CL20 in { | ||
| 6882 | } | ||
| 6883 | } | ||
| 6884 | } | ||
| 6885 | -let MinVersion = CL20 in { | ||
| 6886 | +let Versions = [CL20, CL30] in { | ||
| 6887 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6888 | foreach AS = [GenericAS] in { | ||
| 6889 | def : Builtin<"vload_half", [Float, Size, PointerType<ConstType<Half>, AS>]>; | ||
| 6890 | foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6891 | @@ -851,6 +863,7 @@ let MinVersion = CL20 in { | ||
| 6892 | } | ||
| 6893 | } | ||
| 6894 | } | ||
| 6895 | + } | ||
| 6896 | } | ||
| 6897 | |||
| 6898 | foreach AS = [ConstantAS] in { | ||
| 6899 | @@ -875,7 +888,9 @@ foreach name = ["async_work_group_strided_copy"] in { | ||
| 6900 | def : Builtin<name, [Event, PointerType<AGenTypeN, GlobalAS>, PointerType<ConstType<AGenTypeN>, LocalAS>, Size, Size, Event]>; | ||
| 6901 | } | ||
| 6902 | foreach name = ["wait_group_events"] in { | ||
| 6903 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6904 | def : Builtin<name, [Void, Int, PointerType<Event, GenericAS>]>; | ||
| 6905 | + } | ||
| 6906 | } | ||
| 6907 | foreach name = ["prefetch"] in { | ||
| 6908 | def : Builtin<name, [Void, PointerType<ConstType<AGenTypeN>, GlobalAS>, Size]>; | ||
| 6909 | @@ -1154,7 +1169,8 @@ foreach aQual = ["WO", "RW"] in { | ||
| 6910 | //-------------------------------------------------------------------- | ||
| 6911 | // OpenCL v2.0 s6.13.15 - Work-group Functions | ||
| 6912 | // --- Table 26 --- | ||
| 6913 | -let MinVersion = CL20 in { | ||
| 6914 | +let Versions = [CL20, CL30] in { | ||
| 6915 | + let Extension = FuncExtWorkGroupCollective in { | ||
| 6916 | foreach name = ["work_group_all", "work_group_any"] in { | ||
| 6917 | def : Builtin<name, [Int, Int], Attr.Convergent>; | ||
| 6918 | } | ||
| 6919 | @@ -1169,11 +1185,12 @@ let MinVersion = CL20 in { | ||
| 6920 | def : Builtin<name # op, [IntLongFloatGenType1, IntLongFloatGenType1], Attr.Convergent>; | ||
| 6921 | } | ||
| 6922 | } | ||
| 6923 | + } | ||
| 6924 | } | ||
| 6925 | |||
| 6926 | |||
| 6927 | // OpenCL v2.0 s9.17.3: Additions to section 6.13.1: Work-Item Functions | ||
| 6928 | -let MinVersion = CL20 in { | ||
| 6929 | +let Versions = [CL20] in { | ||
| 6930 | let Extension = FuncExtKhrSubgroups in { | ||
| 6931 | def get_sub_group_size : Builtin<"get_sub_group_size", [UInt]>; | ||
| 6932 | def get_max_sub_group_size : Builtin<"get_max_sub_group_size", [UInt]>; | ||
| 6933 | diff --git a/clang/lib/Sema/Sema.cpp b/clang/lib/Sema/Sema.cpp | ||
| 6934 | index 9cfce5a63b1d..c26f45f62668 100644 | ||
| 6935 | --- a/clang/lib/Sema/Sema.cpp | ||
| 6936 | +++ b/clang/lib/Sema/Sema.cpp | ||
| 6937 | @@ -286,9 +286,10 @@ void Sema::Initialize() { | ||
| 6938 | // Initialize predefined OpenCL types and supported extensions and (optional) | ||
| 6939 | // core features. | ||
| 6940 | if (getLangOpts().OpenCL) { | ||
| 6941 | + getOpenCLOptions().setOpenCLVersion(getLangOpts()); | ||
| 6942 | getOpenCLOptions().addSupport( | ||
| 6943 | Context.getTargetInfo().getSupportedOpenCLOpts()); | ||
| 6944 | - getOpenCLOptions().enableSupportedCore(getLangOpts()); | ||
| 6945 | + getOpenCLOptions().enableSupportedCore(); | ||
| 6946 | addImplicitTypedef("sampler_t", Context.OCLSamplerTy); | ||
| 6947 | addImplicitTypedef("event_t", Context.OCLEventTy); | ||
| 6948 | if (getLangOpts().OpenCLCPlusPlus || getLangOpts().OpenCLVersion >= 200) { | ||
| 6949 | @@ -344,12 +345,18 @@ void Sema::Initialize() { | ||
| 6950 | "cl_khr_int64_base_atomics cl_khr_int64_extended_atomics"); | ||
| 6951 | |||
| 6952 | setOpenCLExtensionForType(AtomicDoubleT, "cl_khr_fp64"); | ||
| 6953 | + setOpenCLExtensionForType(Context.OCLReserveIDTy, "__opencl_c_pipes"); | ||
| 6954 | + setOpenCLExtensionForType(Context.OCLClkEventTy, | ||
| 6955 | + "__opencl_c_device_enqueue"); | ||
| 6956 | + setOpenCLExtensionForType(Context.OCLQueueTy, | ||
| 6957 | + "__opencl_c_device_enqueue"); | ||
| 6958 | } | ||
| 6959 | |||
| 6960 | setOpenCLExtensionForType(Context.DoubleTy, "cl_khr_fp64"); | ||
| 6961 | |||
| 6962 | -#define GENERIC_IMAGE_TYPE_EXT(Type, Id, Ext) \ | ||
| 6963 | - setOpenCLExtensionForType(Context.Id, Ext); | ||
| 6964 | +#define GENERIC_IMAGE_TYPE_EXT(Type, Id, Ext) \ | ||
| 6965 | + setOpenCLExtensionForType(Context.Id, Ext); \ | ||
| 6966 | + setOpenCLExtensionForType(Context.Id, "__opencl_c_images"); | ||
| 6967 | #include "clang/Basic/OpenCLImageTypes.def" | ||
| 6968 | #define EXT_OPAQUE_TYPE(ExtType, Id, Ext) \ | ||
| 6969 | addImplicitTypedef(#ExtType, Context.Id##Ty); \ | ||
| 6970 | @@ -2293,6 +2300,27 @@ bool Sema::isOpenCLDisabledDecl(Decl *FD) { | ||
| 6971 | return false; | ||
| 6972 | } | ||
| 6973 | |||
| 6974 | +template <typename DiagLocT, typename DiagInfoT> | ||
| 6975 | +void Sema::DiagnoseOpenCLRequiresOption(llvm::StringRef OpenCLOptName, | ||
| 6976 | + DiagLocT DiagLoc, DiagInfoT DiagInfo, | ||
| 6977 | + unsigned Selector, | ||
| 6978 | + SourceRange SrcRange) { | ||
| 6979 | + const auto &LO = getLangOpts(); | ||
| 6980 | + auto CLVer = LO.OpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 6981 | + // For versions higher that 3.0 diagnosing feature | ||
| 6982 | + if (CLVer >= 300) { | ||
| 6983 | + OpenCLOptName = | ||
| 6984 | + llvm::StringSwitch<llvm::StringRef>(OpenCLOptName) | ||
| 6985 | + .Case("cl_khr_3d_image_writes", "__opencl_c_3d_image_writes") | ||
| 6986 | + .Case("cl_khr_subgroups", "__opencl_c_subgroups") | ||
| 6987 | + .Case("cl_khr_fp64", "__opencl_c_fp64") | ||
| 6988 | + .Default(OpenCLOptName); | ||
| 6989 | + } | ||
| 6990 | + | ||
| 6991 | + Diag(DiagLoc, diag::err_opencl_requires_extension) | ||
| 6992 | + << Selector << DiagInfo << OpenCLOptName << SrcRange; | ||
| 6993 | +} | ||
| 6994 | + | ||
| 6995 | template <typename T, typename DiagLocT, typename DiagInfoT, typename MapT> | ||
| 6996 | bool Sema::checkOpenCLDisabledTypeOrDecl(T D, DiagLocT DiagLoc, | ||
| 6997 | DiagInfoT DiagInfo, MapT &Map, | ||
| 6998 | @@ -2304,8 +2332,7 @@ bool Sema::checkOpenCLDisabledTypeOrDecl(T D, DiagLocT DiagLoc, | ||
| 6999 | bool Disabled = false; | ||
| 7000 | for (auto &I : Loc->second) { | ||
| 7001 | if (I != CurrOpenCLExtension && !getOpenCLOptions().isEnabled(I)) { | ||
| 7002 | - Diag(DiagLoc, diag::err_opencl_requires_extension) << Selector << DiagInfo | ||
| 7003 | - << I << SrcRange; | ||
| 7004 | + DiagnoseOpenCLRequiresOption(I, DiagLoc, DiagInfo, Selector, SrcRange); | ||
| 7005 | Disabled = true; | ||
| 7006 | } | ||
| 7007 | } | ||
| 7008 | @@ -2341,3 +2368,13 @@ bool Sema::checkOpenCLDisabledDecl(const NamedDecl &D, const Expr &E) { | ||
| 7009 | return checkOpenCLDisabledTypeOrDecl(&D, E.getBeginLoc(), FnName, | ||
| 7010 | OpenCLDeclExtMap, 1, D.getSourceRange()); | ||
| 7011 | } | ||
| 7012 | + | ||
| 7013 | +bool Sema::checkOpenCLSubgroupExtForCallExpr(CallExpr *Call) { | ||
| 7014 | + if (!getOpenCLOptions().isEnabled("cl_khr_subgroups")) { | ||
| 7015 | + DiagnoseOpenCLRequiresOption("cl_khr_subgroups", Call->getBeginLoc(), | ||
| 7016 | + Call->getDirectCallee(), 1, | ||
| 7017 | + Call->getSourceRange()); | ||
| 7018 | + return true; | ||
| 7019 | + } | ||
| 7020 | + return false; | ||
| 7021 | +} | ||
| 7022 | diff --git a/clang/lib/Sema/SemaChecking.cpp b/clang/lib/Sema/SemaChecking.cpp | ||
| 7023 | index 74742023d1b3..efa3b6ab0eb6 100644 | ||
| 7024 | --- a/clang/lib/Sema/SemaChecking.cpp | ||
| 7025 | +++ b/clang/lib/Sema/SemaChecking.cpp | ||
| 7026 | @@ -597,20 +597,11 @@ static bool checkOpenCLBlockArgs(Sema &S, Expr *BlockArg) { | ||
| 7027 | return IllegalParams; | ||
| 7028 | } | ||
| 7029 | |||
| 7030 | -static bool checkOpenCLSubgroupExt(Sema &S, CallExpr *Call) { | ||
| 7031 | - if (!S.getOpenCLOptions().isEnabled("cl_khr_subgroups")) { | ||
| 7032 | - S.Diag(Call->getBeginLoc(), diag::err_opencl_requires_extension) | ||
| 7033 | - << 1 << Call->getDirectCallee() << "cl_khr_subgroups"; | ||
| 7034 | - return true; | ||
| 7035 | - } | ||
| 7036 | - return false; | ||
| 7037 | -} | ||
| 7038 | - | ||
| 7039 | static bool SemaOpenCLBuiltinNDRangeAndBlock(Sema &S, CallExpr *TheCall) { | ||
| 7040 | if (checkArgCount(S, TheCall, 2)) | ||
| 7041 | return true; | ||
| 7042 | |||
| 7043 | - if (checkOpenCLSubgroupExt(S, TheCall)) | ||
| 7044 | + if (S.checkOpenCLSubgroupExtForCallExpr(TheCall)) | ||
| 7045 | return true; | ||
| 7046 | |||
| 7047 | // First argument is an ndrange_t type. | ||
| 7048 | @@ -1564,7 +1555,7 @@ Sema::CheckBuiltinFunctionCall(FunctionDecl *FDecl, unsigned BuiltinID, | ||
| 7049 | break; | ||
| 7050 | case Builtin::BIsub_group_reserve_read_pipe: | ||
| 7051 | case Builtin::BIsub_group_reserve_write_pipe: | ||
| 7052 | - if (checkOpenCLSubgroupExt(*this, TheCall) || | ||
| 7053 | + if (checkOpenCLSubgroupExtForCallExpr(TheCall) || | ||
| 7054 | SemaBuiltinReserveRWPipe(*this, TheCall)) | ||
| 7055 | return ExprError(); | ||
| 7056 | break; | ||
| 7057 | @@ -1577,7 +1568,7 @@ Sema::CheckBuiltinFunctionCall(FunctionDecl *FDecl, unsigned BuiltinID, | ||
| 7058 | break; | ||
| 7059 | case Builtin::BIsub_group_commit_read_pipe: | ||
| 7060 | case Builtin::BIsub_group_commit_write_pipe: | ||
| 7061 | - if (checkOpenCLSubgroupExt(*this, TheCall) || | ||
| 7062 | + if (checkOpenCLSubgroupExtForCallExpr(TheCall) || | ||
| 7063 | SemaBuiltinCommitRWPipe(*this, TheCall)) | ||
| 7064 | return ExprError(); | ||
| 7065 | break; | ||
| 7066 | @@ -4314,6 +4305,20 @@ DiagnoseCStringFormatDirectiveInCFAPI(Sema &S, | ||
| 7067 | } | ||
| 7068 | } | ||
| 7069 | |||
| 7070 | +bool Sema::isSupportedOpenCLOMemoryOrdering(int64_t Ordering) const { | ||
| 7071 | + assert(llvm::isValidAtomicOrderingCABI(Ordering)); | ||
| 7072 | + auto OrderingCABI = (llvm::AtomicOrderingCABI)Ordering; | ||
| 7073 | + switch (OrderingCABI) { | ||
| 7074 | + case llvm::AtomicOrderingCABI::acquire: | ||
| 7075 | + case llvm::AtomicOrderingCABI::release: | ||
| 7076 | + case llvm::AtomicOrderingCABI::acq_rel: | ||
| 7077 | + return OpenCLFeatures.isEnabled("__opencl_c_atomic_order_acq_rel"); | ||
| 7078 | + | ||
| 7079 | + default: | ||
| 7080 | + return true; | ||
| 7081 | + } | ||
| 7082 | +} | ||
| 7083 | + | ||
| 7084 | /// Determine whether the given type has a non-null nullability annotation. | ||
| 7085 | static bool isNonNullType(ASTContext &ctx, QualType type) { | ||
| 7086 | if (auto nullability = type->getNullability(ctx)) | ||
| 7087 | @@ -5067,10 +5072,17 @@ ExprResult Sema::BuildAtomicExpr(SourceRange CallRange, SourceRange ExprRange, | ||
| 7088 | if (SubExprs.size() >= 2 && Form != Init) { | ||
| 7089 | llvm::APSInt Result(32); | ||
| 7090 | if (SubExprs[1]->isIntegerConstantExpr(Result, Context) && | ||
| 7091 | - !isValidOrderingForOp(Result.getSExtValue(), Op)) | ||
| 7092 | + !isValidOrderingForOp(Result.getSExtValue(), Op)) { | ||
| 7093 | Diag(SubExprs[1]->getBeginLoc(), | ||
| 7094 | diag::warn_atomic_op_has_invalid_memory_order) | ||
| 7095 | << SubExprs[1]->getSourceRange(); | ||
| 7096 | + } else if (IsOpenCL && | ||
| 7097 | + !isSupportedOpenCLOMemoryOrdering(Result.getSExtValue())) { | ||
| 7098 | + Diag(SubExprs[1]->getBeginLoc(), | ||
| 7099 | + diag::err_opencl_memory_ordering_require_feat) | ||
| 7100 | + << SubExprs[1]->getSourceRange(); | ||
| 7101 | + return ExprError(); | ||
| 7102 | + } | ||
| 7103 | } | ||
| 7104 | |||
| 7105 | if (auto ScopeModel = AtomicExpr::getScopeModel(Op)) { | ||
| 7106 | diff --git a/clang/lib/Sema/SemaDecl.cpp b/clang/lib/Sema/SemaDecl.cpp | ||
| 7107 | index 64146f4a912f..c1e629b5dc76 100644 | ||
| 7108 | --- a/clang/lib/Sema/SemaDecl.cpp | ||
| 7109 | +++ b/clang/lib/Sema/SemaDecl.cpp | ||
| 7110 | @@ -6152,7 +6152,9 @@ void Sema::deduceOpenCLAddressSpace(ValueDecl *Decl) { | ||
| 7111 | if (Type->isSamplerT() || Type->isVoidType()) | ||
| 7112 | return; | ||
| 7113 | LangAS ImplAS = LangAS::opencl_private; | ||
| 7114 | - if ((getLangOpts().OpenCLCPlusPlus || getLangOpts().OpenCLVersion >= 200) && | ||
| 7115 | + if ((getLangOpts().OpenCLCPlusPlus || | ||
| 7116 | + getOpenCLOptions().isEnabled( | ||
| 7117 | + "__opencl_c_program_scope_global_variables")) && | ||
| 7118 | Var->hasGlobalStorage()) | ||
| 7119 | ImplAS = LangAS::opencl_global; | ||
| 7120 | // If the original type from a decayed type is an array type and that array | ||
| 7121 | @@ -7682,6 +7684,10 @@ void Sema::CheckVariableDeclarationType(VarDecl *NewVD) { | ||
| 7122 | // OpenCL C v2.0 s6.5.1 - Variables defined at program scope and static | ||
| 7123 | // variables inside a function can also be declared in the global | ||
| 7124 | // address space. | ||
| 7125 | + // OpenCL C v3.0 s5.5 - For OpenCL C 2.0, or with the | ||
| 7126 | + // __opencl_c_program_scope_global_variables feature macro, the | ||
| 7127 | + // address space for a variable at program scope or a static variable | ||
| 7128 | + // also be __global | ||
| 7129 | // C++ for OpenCL inherits rule from OpenCL C v2.0. | ||
| 7130 | // FIXME: Adding local AS in C++ for OpenCL might make sense. | ||
| 7131 | if (NewVD->isFileVarDecl() || NewVD->isStaticLocal() || | ||
| 7132 | @@ -7689,10 +7695,11 @@ void Sema::CheckVariableDeclarationType(VarDecl *NewVD) { | ||
| 7133 | if (!T->isSamplerT() && | ||
| 7134 | !(T.getAddressSpace() == LangAS::opencl_constant || | ||
| 7135 | (T.getAddressSpace() == LangAS::opencl_global && | ||
| 7136 | - (getLangOpts().OpenCLVersion == 200 || | ||
| 7137 | - getLangOpts().OpenCLCPlusPlus)))) { | ||
| 7138 | + (OpenCLFeatures.isEnabled( | ||
| 7139 | + "__opencl_c_program_scope_global_variables"))))) { | ||
| 7140 | int Scope = NewVD->isStaticLocal() | NewVD->hasExternalStorage() << 1; | ||
| 7141 | - if (getLangOpts().OpenCLVersion == 200 || getLangOpts().OpenCLCPlusPlus) | ||
| 7142 | + if (OpenCLFeatures.isEnabled( | ||
| 7143 | + "__opencl_c_program_scope_global_variables")) | ||
| 7144 | Diag(NewVD->getLocation(), diag::err_opencl_global_invalid_addr_space) | ||
| 7145 | << Scope << "global or constant"; | ||
| 7146 | else | ||
| 7147 | diff --git a/clang/lib/Sema/SemaDeclAttr.cpp b/clang/lib/Sema/SemaDeclAttr.cpp | ||
| 7148 | index 849bc09063b3..c963b95b131a 100644 | ||
| 7149 | --- a/clang/lib/Sema/SemaDeclAttr.cpp | ||
| 7150 | +++ b/clang/lib/Sema/SemaDeclAttr.cpp | ||
| 7151 | @@ -6362,7 +6362,7 @@ static void handleInternalLinkageAttr(Sema &S, Decl *D, const ParsedAttr &AL) { | ||
| 7152 | } | ||
| 7153 | |||
| 7154 | static void handleOpenCLNoSVMAttr(Sema &S, Decl *D, const ParsedAttr &AL) { | ||
| 7155 | - if (S.LangOpts.OpenCLVersion != 200) | ||
| 7156 | + if (S.LangOpts.OpenCLVersion < 200) | ||
| 7157 | S.Diag(AL.getLoc(), diag::err_attribute_requires_opencl_version) | ||
| 7158 | << AL << "2.0" << 0; | ||
| 7159 | else | ||
| 7160 | @@ -6446,6 +6446,13 @@ static void handleOpenCLAccessAttr(Sema &S, Decl *D, const ParsedAttr &AL) { | ||
| 7161 | << AL << PDecl->getType() << DeclTy->isImageType(); | ||
| 7162 | D->setInvalidDecl(true); | ||
| 7163 | return; | ||
| 7164 | + } else if ((!S.getLangOpts().OpenCLCPlusPlus && | ||
| 7165 | + S.getLangOpts().OpenCLVersion >= 200) && | ||
| 7166 | + !S.getOpenCLOptions().isEnabled( | ||
| 7167 | + "__opencl_c_read_write_images")) { | ||
| 7168 | + S.Diag(AL.getLoc(), diag::err_opencl_requires_extension) | ||
| 7169 | + << 0 << PDecl->getType() << "__opencl_c_read_write_images"; | ||
| 7170 | + return; | ||
| 7171 | } | ||
| 7172 | } | ||
| 7173 | } | ||
| 7174 | diff --git a/clang/lib/Sema/SemaDeclCXX.cpp b/clang/lib/Sema/SemaDeclCXX.cpp | ||
| 7175 | index 831e55046e80..4481a59b4517 100644 | ||
| 7176 | --- a/clang/lib/Sema/SemaDeclCXX.cpp | ||
| 7177 | +++ b/clang/lib/Sema/SemaDeclCXX.cpp | ||
| 7178 | @@ -14906,6 +14906,11 @@ CheckOperatorNewDeleteTypes(Sema &SemaRef, const FunctionDecl *FnDecl, | ||
| 7179 | if (auto *PtrTy = ResultType->getAs<PointerType>()) { | ||
| 7180 | ResultType = RemoveAddressSpaceFromPtr(SemaRef, PtrTy); | ||
| 7181 | } | ||
| 7182 | + if (CanQual<PointerType> ExpectedPtrTy = | ||
| 7183 | + ExpectedResultType->getAs<PointerType>()) { | ||
| 7184 | + ExpectedResultType = SemaRef.Context.getCanonicalType( | ||
| 7185 | + RemoveAddressSpaceFromPtr(SemaRef, ExpectedPtrTy->getTypePtr())); | ||
| 7186 | + } | ||
| 7187 | } | ||
| 7188 | |||
| 7189 | // Check that the result type is what we expect. | ||
| 7190 | @@ -14939,6 +14944,11 @@ CheckOperatorNewDeleteTypes(Sema &SemaRef, const FunctionDecl *FnDecl, | ||
| 7191 | FnDecl->getParamDecl(0)->getType()->getAs<PointerType>()) { | ||
| 7192 | FirstParamType = RemoveAddressSpaceFromPtr(SemaRef, PtrTy); | ||
| 7193 | } | ||
| 7194 | + if (CanQual<PointerType> ExpectedPtrTy = | ||
| 7195 | + ExpectedFirstParamType->getAs<PointerType>()) { | ||
| 7196 | + ExpectedFirstParamType = SemaRef.Context.getCanonicalType( | ||
| 7197 | + RemoveAddressSpaceFromPtr(SemaRef, ExpectedPtrTy->getTypePtr())); | ||
| 7198 | + } | ||
| 7199 | } | ||
| 7200 | if (SemaRef.Context.getCanonicalType(FirstParamType).getUnqualifiedType() != | ||
| 7201 | ExpectedFirstParamType) | ||
| 7202 | diff --git a/clang/lib/Sema/SemaLookup.cpp b/clang/lib/Sema/SemaLookup.cpp | ||
| 7203 | index 8d96404a5c27..8f21203b9508 100644 | ||
| 7204 | --- a/clang/lib/Sema/SemaLookup.cpp | ||
| 7205 | +++ b/clang/lib/Sema/SemaLookup.cpp | ||
| 7206 | @@ -771,19 +771,20 @@ static void InsertOCLBuiltinDeclarationsFromTable(Sema &S, LookupResult &LR, | ||
| 7207 | // as argument. Only meaningful for generic types, otherwise equals 1. | ||
| 7208 | unsigned GenTypeMaxCnt; | ||
| 7209 | |||
| 7210 | + ASTContext &Context = S.Context; | ||
| 7211 | + | ||
| 7212 | + // Ignore this BIF if its version does not match the language options. | ||
| 7213 | + unsigned OpenCLVersion = Context.getLangOpts().OpenCLVersion; | ||
| 7214 | + if (Context.getLangOpts().OpenCLCPlusPlus) | ||
| 7215 | + OpenCLVersion = 200; | ||
| 7216 | + | ||
| 7217 | + unsigned short VersionCode = OpenCLOptions::EncodeVersion(OpenCLVersion); | ||
| 7218 | + | ||
| 7219 | for (unsigned SignatureIndex = 0; SignatureIndex < Len; SignatureIndex++) { | ||
| 7220 | const OpenCLBuiltinStruct &OpenCLBuiltin = | ||
| 7221 | BuiltinTable[FctIndex + SignatureIndex]; | ||
| 7222 | - ASTContext &Context = S.Context; | ||
| 7223 | |||
| 7224 | - // Ignore this BIF if its version does not match the language options. | ||
| 7225 | - unsigned OpenCLVersion = Context.getLangOpts().OpenCLVersion; | ||
| 7226 | - if (Context.getLangOpts().OpenCLCPlusPlus) | ||
| 7227 | - OpenCLVersion = 200; | ||
| 7228 | - if (OpenCLVersion < OpenCLBuiltin.MinVersion) | ||
| 7229 | - continue; | ||
| 7230 | - if ((OpenCLBuiltin.MaxVersion != 0) && | ||
| 7231 | - (OpenCLVersion >= OpenCLBuiltin.MaxVersion)) | ||
| 7232 | + if (!(OpenCLBuiltin.AllVersions & VersionCode)) | ||
| 7233 | continue; | ||
| 7234 | |||
| 7235 | SmallVector<QualType, 1> RetTypes; | ||
| 7236 | diff --git a/clang/lib/Sema/SemaType.cpp b/clang/lib/Sema/SemaType.cpp | ||
| 7237 | index 93ddd047e09b..93211b801f8d 100644 | ||
| 7238 | --- a/clang/lib/Sema/SemaType.cpp | ||
| 7239 | +++ b/clang/lib/Sema/SemaType.cpp | ||
| 7240 | @@ -2016,7 +2016,7 @@ static QualType deduceOpenCLPointeeAddrSpace(Sema &S, QualType PointeeType) { | ||
| 7241 | !PointeeType.hasAddressSpace()) | ||
| 7242 | PointeeType = S.getASTContext().getAddrSpaceQualType( | ||
| 7243 | PointeeType, | ||
| 7244 | - S.getLangOpts().OpenCLCPlusPlus || S.getLangOpts().OpenCLVersion == 200 | ||
| 7245 | + S.getOpenCLOptions().isEnabled("__opencl_c_generic_address_space") | ||
| 7246 | ? LangAS::opencl_generic | ||
| 7247 | : LangAS::opencl_private); | ||
| 7248 | return PointeeType; | ||
| 7249 | @@ -5160,9 +5160,15 @@ static TypeSourceInfo *GetFullTypeForDeclarator(TypeProcessingState &state, | ||
| 7250 | } | ||
| 7251 | |||
| 7252 | case DeclaratorChunk::Pipe: { | ||
| 7253 | - T = S.BuildReadPipeType(T, DeclType.Loc); | ||
| 7254 | - processTypeAttrs(state, T, TAL_DeclSpec, | ||
| 7255 | - D.getMutableDeclSpec().getAttributes()); | ||
| 7256 | + if (S.getOpenCLOptions().isEnabled("__opencl_c_pipes")) { | ||
| 7257 | + T = S.BuildReadPipeType(T, DeclType.Loc); | ||
| 7258 | + processTypeAttrs(state, T, TAL_DeclSpec, | ||
| 7259 | + D.getMutableDeclSpec().getAttributes()); | ||
| 7260 | + } else { | ||
| 7261 | + D.setInvalidType(true); | ||
| 7262 | + T = Context.IntTy; | ||
| 7263 | + S.Diag(D.getIdentifierLoc(), diag::err_opencl_pipes_require_feat); | ||
| 7264 | + } | ||
| 7265 | break; | ||
| 7266 | } | ||
| 7267 | } | ||
| 7268 | diff --git a/clang/test/CodeGenOpenCL/addr-space-struct-arg.cl b/clang/test/CodeGenOpenCL/addr-space-struct-arg.cl | ||
| 7269 | index cdbf28bbcad8..0bedff5ef0f3 100644 | ||
| 7270 | --- a/clang/test/CodeGenOpenCL/addr-space-struct-arg.cl | ||
| 7271 | +++ b/clang/test/CodeGenOpenCL/addr-space-struct-arg.cl | ||
| 7272 | @@ -2,7 +2,8 @@ | ||
| 7273 | // RUN: %clang_cc1 %s -emit-llvm -o - -O0 -triple amdgcn | FileCheck -enable-var-scope -check-prefixes=COM,AMDGCN %s | ||
| 7274 | // RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL2.0 -O0 -triple amdgcn | FileCheck -enable-var-scope -check-prefixes=COM,AMDGCN,AMDGCN20 %s | ||
| 7275 | // RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL1.2 -O0 -triple spir-unknown-unknown-unknown | FileCheck -enable-var-scope -check-prefixes=SPIR %s | ||
| 7276 | - | ||
| 7277 | +// RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL3.0 -O0 -triple spir-unknown-unknown-unknown | FileCheck -enable-var-scope -check-prefixes=SPIR %s | ||
| 7278 | +// RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL3.0 -cl-ext=__opencl_c_program_scope_global_variables -O0 -triple spir-unknown-unknown-unknown | FileCheck -enable-var-scope -check-prefixes=SPIR %s | ||
| 7279 | typedef int int2 __attribute__((ext_vector_type(2))); | ||
| 7280 | |||
| 7281 | typedef struct { | ||
| 7282 | @@ -39,7 +40,7 @@ struct LargeStructTwoMember { | ||
| 7283 | int2 y[20]; | ||
| 7284 | }; | ||
| 7285 | |||
| 7286 | -#if __OPENCL_C_VERSION__ >= 200 | ||
| 7287 | +#ifdef __opencl_c_program_scope_global_variables | ||
| 7288 | struct LargeStructOneMember g_s; | ||
| 7289 | #endif | ||
| 7290 | |||
| 7291 | @@ -98,7 +99,7 @@ void FuncOneLargeMember(struct LargeStructOneMember u) { | ||
| 7292 | // AMDGCN20: %[[r0:.*]] = bitcast %struct.LargeStructOneMember addrspace(5)* %[[byval_temp]] to i8 addrspace(5)* | ||
| 7293 | // AMDGCN20: call void @llvm.memcpy.p5i8.p1i8.i64(i8 addrspace(5)* align 8 %[[r0]], i8 addrspace(1)* align 8 bitcast (%struct.LargeStructOneMember addrspace(1)* @g_s to i8 addrspace(1)*), i64 800, i1 false) | ||
| 7294 | // AMDGCN20: call void @FuncOneLargeMember(%struct.LargeStructOneMember addrspace(5)* byval(%struct.LargeStructOneMember) align 8 %[[byval_temp]]) | ||
| 7295 | -#if __OPENCL_C_VERSION__ >= 200 | ||
| 7296 | +#ifdef __opencl_c_program_scope_global_variables | ||
| 7297 | void test_indirect_arg_globl(void) { | ||
| 7298 | FuncOneLargeMember(g_s); | ||
| 7299 | } | ||
| 7300 | diff --git a/clang/test/CodeGenOpenCL/address-spaces-conversions.cl b/clang/test/CodeGenOpenCL/address-spaces-conversions.cl | ||
| 7301 | index 52feccc540bb..9ecffcca5ee9 100644 | ||
| 7302 | --- a/clang/test/CodeGenOpenCL/address-spaces-conversions.cl | ||
| 7303 | +++ b/clang/test/CodeGenOpenCL/address-spaces-conversions.cl | ||
| 7304 | @@ -1,5 +1,7 @@ | ||
| 7305 | // RUN: %clang_cc1 %s -triple x86_64-unknown-linux-gnu -O0 -ffake-address-space-map -cl-std=CL2.0 -emit-llvm -o - | FileCheck %s | ||
| 7306 | +// RUN: %clang_cc1 %s -triple x86_64-unknown-linux-gnu -O0 -ffake-address-space-map -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space -emit-llvm -o - | FileCheck %s | ||
| 7307 | // RUN: %clang_cc1 %s -triple x86_64-unknown-linux-gnu -O0 -cl-std=CL2.0 -emit-llvm -o - | FileCheck --check-prefix=CHECK-NOFAKE %s | ||
| 7308 | +// RUN: %clang_cc1 %s -triple x86_64-unknown-linux-gnu -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space -emit-llvm -o - | FileCheck --check-prefix=CHECK-NOFAKE %s | ||
| 7309 | // When -ffake-address-space-map is not used, all addr space mapped to 0 for x86_64. | ||
| 7310 | |||
| 7311 | // test that we generate address space casts everywhere we need conversions of | ||
| 7312 | diff --git a/clang/test/CodeGenOpenCL/address-spaces-mangling.cl b/clang/test/CodeGenOpenCL/address-spaces-mangling.cl | ||
| 7313 | index 50622f099143..e19ec8451d0d 100644 | ||
| 7314 | --- a/clang/test/CodeGenOpenCL/address-spaces-mangling.cl | ||
| 7315 | +++ b/clang/test/CodeGenOpenCL/address-spaces-mangling.cl | ||
| 7316 | @@ -6,6 +6,7 @@ | ||
| 7317 | // We check that the address spaces are mangled the same in both version of OpenCL | ||
| 7318 | // RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL2.0 -emit-llvm -o - | FileCheck -check-prefix=OCL-20 %s | ||
| 7319 | // RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL1.2 -emit-llvm -o - | FileCheck -check-prefix=OCL-12 %s | ||
| 7320 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL3.0 -emit-llvm -o - | FileCheck -check-prefix=OCL-12 %s | ||
| 7321 | |||
| 7322 | // We can't name this f as private is equivalent to default | ||
| 7323 | // no specifier given address space so we get multiple definition | ||
| 7324 | @@ -47,7 +48,7 @@ void f(constant int *arg) { } | ||
| 7325 | // OCL-20-DAG: @_Z1fPU3AS2i | ||
| 7326 | // OCL-12-DAG: @_Z1fPU3AS2i | ||
| 7327 | |||
| 7328 | -#if __OPENCL_C_VERSION__ >= 200 | ||
| 7329 | +#if __OPENCL_C_VERSION__ == 200 | ||
| 7330 | __attribute__((overloadable)) | ||
| 7331 | void f(generic int *arg) { } | ||
| 7332 | // ASMANG20: @_Z1fPU3AS4i | ||
| 7333 | diff --git a/clang/test/CodeGenOpenCL/address-spaces.cl b/clang/test/CodeGenOpenCL/address-spaces.cl | ||
| 7334 | index 3c8fea2a80bc..26a741338b3a 100644 | ||
| 7335 | --- a/clang/test/CodeGenOpenCL/address-spaces.cl | ||
| 7336 | +++ b/clang/test/CodeGenOpenCL/address-spaces.cl | ||
| 7337 | @@ -1,9 +1,13 @@ | ||
| 7338 | // RUN: %clang_cc1 %s -O0 -ffake-address-space-map -emit-llvm -o - | FileCheck %s --check-prefixes=CHECK,SPIR | ||
| 7339 | +// RUN: %clang_cc1 %s -O0 -cl-std=CL3.0 -ffake-address-space-map -emit-llvm -o - | FileCheck %s --check-prefixes=CHECK,SPIR | ||
| 7340 | // RUN: %clang_cc1 %s -O0 -DCL20 -cl-std=CL2.0 -ffake-address-space-map -emit-llvm -o - | FileCheck %s --check-prefixes=CL20,CL20SPIR | ||
| 7341 | // RUN: %clang_cc1 %s -O0 -triple amdgcn-amd-amdhsa -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7342 | +// RUN: %clang_cc1 %s -O0 -cl-std=CL3.0 -triple amdgcn-amd-amdhsa -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7343 | // RUN: %clang_cc1 %s -O0 -triple amdgcn-amd-amdhsa -DCL20 -cl-std=CL2.0 -emit-llvm -o - | FileCheck %s --check-prefixes=CL20,CL20AMDGCN | ||
| 7344 | // RUN: %clang_cc1 %s -O0 -triple amdgcn-mesa-mesa3d -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7345 | +// RUN: %clang_cc1 %s -O0 -cl-std=CL3.0 -triple amdgcn-mesa-mesa3d -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7346 | // RUN: %clang_cc1 %s -O0 -triple r600-- -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7347 | +// RUN: %clang_cc1 %s -O0 -cl-std=CL3.0 -triple r600-- -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7348 | |||
| 7349 | // SPIR: %struct.S = type { i32, i32, i32* } | ||
| 7350 | // CL20SPIR: %struct.S = type { i32, i32, i32 addrspace(4)* } | ||
| 7351 | diff --git a/clang/test/CodeGenOpenCL/amdgcn-automatic-variable.cl b/clang/test/CodeGenOpenCL/amdgcn-automatic-variable.cl | ||
| 7352 | index 7216cb517495..8d3b30fe8074 100644 | ||
| 7353 | --- a/clang/test/CodeGenOpenCL/amdgcn-automatic-variable.cl | ||
| 7354 | +++ b/clang/test/CodeGenOpenCL/amdgcn-automatic-variable.cl | ||
| 7355 | @@ -1,4 +1,5 @@ | ||
| 7356 | // RUN: %clang_cc1 -O0 -cl-std=CL1.2 -triple amdgcn---amdgizcl -emit-llvm %s -o - | FileCheck -check-prefixes=CHECK,CL12 %s | ||
| 7357 | +// RUN: %clang_cc1 -O0 -cl-std=CL3.0 -triple amdgcn---amdgizcl -emit-llvm %s -o - | FileCheck -check-prefixes=CHECK,CL12 %s | ||
| 7358 | // RUN: %clang_cc1 -O0 -cl-std=CL2.0 -triple amdgcn---amdgizcl -emit-llvm %s -o - | FileCheck -check-prefixes=CHECK,CL20 %s | ||
| 7359 | |||
| 7360 | // CL12-LABEL: define void @func1(i32 addrspace(5)* %x) | ||
| 7361 | diff --git a/clang/test/CodeGenOpenCL/amdgpu-sizeof-alignof.cl b/clang/test/CodeGenOpenCL/amdgpu-sizeof-alignof.cl | ||
| 7362 | index a5d438933fa4..8073c7756eb6 100644 | ||
| 7363 | --- a/clang/test/CodeGenOpenCL/amdgpu-sizeof-alignof.cl | ||
| 7364 | +++ b/clang/test/CodeGenOpenCL/amdgpu-sizeof-alignof.cl | ||
| 7365 | @@ -4,6 +4,17 @@ | ||
| 7366 | // RUN: %clang_cc1 -triple amdgcn---opencl -cl-std=CL2.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7367 | // RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-std=CL1.2 %s -emit-llvm -o - | FileCheck %s | ||
| 7368 | // RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-std=CL2.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7369 | +// RUN: %clang_cc1 -triple r600 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7370 | +// RUN: %clang_cc1 -triple amdgcn-mesa-mesa3d -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7371 | +// RUN: %clang_cc1 -triple amdgcn---opencl -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7372 | +// RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7373 | +// RUN: %clang_cc1 -triple amdgcn-mesa-mesa3d -cl-ext=__opencl_c_generic_address_space -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7374 | +// RUN: %clang_cc1 -triple amdgcn---opencl -cl-ext=__opencl_c_generic_address_space -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7375 | +// RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-ext=__opencl_c_generic_address_space -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7376 | +// RUN: %clang_cc1 -triple r600 -cl-ext=__opencl_c_fp64 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7377 | +// RUN: %clang_cc1 -triple amdgcn-mesa-mesa3d -cl-ext=__opencl_c_fp64 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7378 | +// RUN: %clang_cc1 -triple amdgcn---opencl -cl-ext=__opencl_c_fp64 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7379 | +// RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-ext=__opencl_c_fp64 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7380 | |||
| 7381 | #ifdef __AMDGCN__ | ||
| 7382 | #define PTSIZE 8 | ||
| 7383 | @@ -11,7 +22,7 @@ | ||
| 7384 | #define PTSIZE 4 | ||
| 7385 | #endif | ||
| 7386 | |||
| 7387 | -#ifdef cl_khr_fp64 | ||
| 7388 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 7389 | #pragma OPENCL EXTENSION cl_khr_fp64 : enable | ||
| 7390 | #endif | ||
| 7391 | #ifdef cl_khr_fp16 | ||
| 7392 | @@ -59,8 +70,12 @@ void test() { | ||
| 7393 | check(__alignof__(double) == 8); | ||
| 7394 | #endif | ||
| 7395 | |||
| 7396 | - check(sizeof(void*) == (__OPENCL_C_VERSION__ >= 200 ? 8 : 4)); | ||
| 7397 | - check(__alignof__(void*) == (__OPENCL_C_VERSION__ >= 200 ? 8 : 4)); | ||
| 7398 | + check(sizeof(private void*) == 4); | ||
| 7399 | + check(__alignof__(private void*) == 4); | ||
| 7400 | +#ifdef __opencl_c_generic_address_space | ||
| 7401 | + check(sizeof(generic void*) == 8); | ||
| 7402 | + check(__alignof__(generic void*) == 8); | ||
| 7403 | +#endif | ||
| 7404 | check(sizeof(global_ptr_t) == PTSIZE); | ||
| 7405 | check(__alignof__(global_ptr_t) == PTSIZE); | ||
| 7406 | check(sizeof(constant_ptr_t) == PTSIZE); | ||
| 7407 | diff --git a/clang/test/CodeGenOpenCL/arm-integer-dot-product.cl b/clang/test/CodeGenOpenCL/arm-integer-dot-product.cl | ||
| 7408 | index d1ab6aceac5c..70c5bace023b 100644 | ||
| 7409 | --- a/clang/test/CodeGenOpenCL/arm-integer-dot-product.cl | ||
| 7410 | +++ b/clang/test/CodeGenOpenCL/arm-integer-dot-product.cl | ||
| 7411 | @@ -1,4 +1,5 @@ | ||
| 7412 | // RUN: %clang_cc1 %s -triple spir-unknown-unknown -finclude-default-header -cl-std=CL1.2 -emit-llvm -o - -O0 | FileCheck %s | ||
| 7413 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -finclude-default-header -cl-std=CL3.0 -emit-llvm -o - -O0 | FileCheck %s | ||
| 7414 | |||
| 7415 | #pragma OPENCL EXTENSION cl_arm_integer_dot_product_int8 : enable | ||
| 7416 | void test_int8(uchar4 ua, uchar4 ub, char4 sa, char4 sb) { | ||
| 7417 | diff --git a/clang/test/CodeGenOpenCL/cl-uniform-wg-size.cl b/clang/test/CodeGenOpenCL/cl-uniform-wg-size.cl | ||
| 7418 | index 76ace5dca21e..5dc43e222f75 100644 | ||
| 7419 | --- a/clang/test/CodeGenOpenCL/cl-uniform-wg-size.cl | ||
| 7420 | +++ b/clang/test/CodeGenOpenCL/cl-uniform-wg-size.cl | ||
| 7421 | @@ -1,6 +1,8 @@ | ||
| 7422 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL1.2 -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-UNIFORM | ||
| 7423 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL2.0 -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-NONUNIFORM | ||
| 7424 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL2.0 -cl-uniform-work-group-size -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-UNIFORM | ||
| 7425 | +// RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL3.0 -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-NONUNIFORM | ||
| 7426 | +// RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL3.0 -cl-uniform-work-group-size -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-UNIFORM | ||
| 7427 | |||
| 7428 | kernel void ker() {}; | ||
| 7429 | // CHECK: define{{.*}}@ker() #0 | ||
| 7430 | diff --git a/clang/test/CodeGenOpenCL/fpmath.cl b/clang/test/CodeGenOpenCL/fpmath.cl | ||
| 7431 | index 0108d909c94e..b28392739c71 100644 | ||
| 7432 | --- a/clang/test/CodeGenOpenCL/fpmath.cl | ||
| 7433 | +++ b/clang/test/CodeGenOpenCL/fpmath.cl | ||
| 7434 | @@ -2,6 +2,8 @@ | ||
| 7435 | // RUN: %clang_cc1 %s -emit-llvm -o - -triple spir-unknown-unknown -cl-fp32-correctly-rounded-divide-sqrt | FileCheck --check-prefix=CHECK --check-prefix=DIVOPT %s | ||
| 7436 | // RUN: %clang_cc1 %s -emit-llvm -o - -DNOFP64 -cl-std=CL1.2 -triple r600-unknown-unknown -target-cpu r600 -pedantic | FileCheck --check-prefix=CHECK-FLT %s | ||
| 7437 | // RUN: %clang_cc1 %s -emit-llvm -o - -DFP64 -cl-std=CL1.2 -triple spir-unknown-unknown -pedantic | FileCheck --check-prefix=CHECK-DBL %s | ||
| 7438 | +// RUN: %clang_cc1 %s -emit-llvm -o - -DNOFP64 -cl-std=CL3.0 -triple r600-unknown-unknown -target-cpu r600 -pedantic | FileCheck --check-prefix=CHECK-FLT %s | ||
| 7439 | +// RUN: %clang_cc1 %s -emit-llvm -o - -DFP64 -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 -triple spir-unknown-unknown -pedantic | FileCheck --check-prefix=CHECK-DBL %s | ||
| 7440 | |||
| 7441 | typedef __attribute__(( ext_vector_type(4) )) float float4; | ||
| 7442 | |||
| 7443 | diff --git a/clang/test/CodeGenOpenCL/generic-address-space-feature.cl b/clang/test/CodeGenOpenCL/generic-address-space-feature.cl | ||
| 7444 | new file mode 100644 | ||
| 7445 | index 000000000000..890860abe4d9 | ||
| 7446 | --- /dev/null | ||
| 7447 | +++ b/clang/test/CodeGenOpenCL/generic-address-space-feature.cl | ||
| 7448 | @@ -0,0 +1,28 @@ | ||
| 7449 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL1.2 -cl-ext=-cl_khr_fp64 -finclude-default-header -emit-llvm -o - | FileCheck %s --check-prefixes=CL12 | ||
| 7450 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL1.2 -cl-ext=-cl_khr_fp64 -fdeclare-opencl-builtins -emit-llvm -o - | FileCheck %s --check-prefixes=CL12 | ||
| 7451 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL2.0 -cl-ext=-cl_khr_fp64 -finclude-default-header -emit-llvm -o - | FileCheck %s --check-prefixes=CL20 | ||
| 7452 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL2.0 -cl-ext=-cl_khr_fp64 -fdeclare-opencl-builtins -emit-llvm -o - | FileCheck %s --check-prefixes=CL20 | ||
| 7453 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL3.0 -cl-ext=-cl_khr_fp64 -finclude-default-header -emit-llvm -o - | FileCheck %s --check-prefixes=CL30 | ||
| 7454 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL3.0 -cl-ext=-cl_khr_fp64,__opencl_c_generic_address_space -finclude-default-header -emit-llvm -o - | FileCheck %s --check-prefixes=CL30-GENERIC | ||
| 7455 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL3.0 -cl-ext=-cl_khr_fp64 -fdeclare-opencl-builtins -emit-llvm -o - | FileCheck %s --check-prefixes=CL30 | ||
| 7456 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL3.0 -cl-ext=-cl_khr_fp64,__opencl_c_generic_address_space -fdeclare-opencl-builtins -emit-llvm -o - | FileCheck %s --check-prefixes=CL30-GENERIC | ||
| 7457 | + | ||
| 7458 | +void test(global float* src1, local float *src2, private float *src3, float *src4, float tmp) { | ||
| 7459 | + // CL20: %{{.+}} = addrspacecast float addrspace(1)* %{{.+}} to float addrspace(4)* | ||
| 7460 | + // CL12-NOT: addrspacecast | ||
| 7461 | + // CL30-NOT: addrspacecast | ||
| 7462 | + // CL30-GENERIC-NOT: addrspacecast | ||
| 7463 | + tmp = sincos(tmp, src1); | ||
| 7464 | + // CL20: %{{.+}} = addrspacecast float addrspace(3)* %{{.+}} to float addrspace(4)* | ||
| 7465 | + // CL12-NOT: addrspacecast | ||
| 7466 | + // CL30-NOT: addrspacecast | ||
| 7467 | + // CL30-GENERIC-NOT: addrspacecast | ||
| 7468 | + tmp = sincos(tmp, src2); | ||
| 7469 | + | ||
| 7470 | + // CL12: %{{.+}} = call {{(spir_func )?}}float [[FUNCNAME:@.*sincos.*]](float %{{.+}}, float* {{.+}}) | ||
| 7471 | + // CL20: %{{.+}} = call {{(spir_func )?}}float [[FUNCNAME:@.*sincos.*]](float %{{.+}}, float addrspace(4)* {{.+}}) | ||
| 7472 | + // CL30: %{{.+}} = call {{(spir_func )?}}float [[FUNCNAME:@.*sincos.*]](float %{{.+}}, float* {{.+}}) | ||
| 7473 | + // CL30-GENERIC: %{{.+}} = call {{(spir_func )?}}float [[FUNCNAME:@.*sincos.*]](float %{{.+}}, float addrspace(4)* {{.+}}) | ||
| 7474 | + // CHECK: addrspacecast | ||
| 7475 | + tmp = sincos(tmp, src4); | ||
| 7476 | +} | ||
| 7477 | diff --git a/clang/test/CodeGenOpenCL/intel-subgroups-avc-ext-types.cl b/clang/test/CodeGenOpenCL/intel-subgroups-avc-ext-types.cl | ||
| 7478 | index 515f13f6e768..5aa31ac6f345 100644 | ||
| 7479 | --- a/clang/test/CodeGenOpenCL/intel-subgroups-avc-ext-types.cl | ||
| 7480 | +++ b/clang/test/CodeGenOpenCL/intel-subgroups-avc-ext-types.cl | ||
| 7481 | @@ -1,4 +1,5 @@ | ||
| 7482 | // RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL1.2 -cl-ext=+cl_intel_device_side_avc_motion_estimation -emit-llvm -o - -O0 | FileCheck %s | ||
| 7483 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL3.0 -cl-ext=+cl_intel_device_side_avc_motion_estimation -emit-llvm -o - -O0 | FileCheck %s | ||
| 7484 | |||
| 7485 | // CHECK: %opencl.intel_sub_group_avc_mce_payload_t = type opaque | ||
| 7486 | // CHECK: %opencl.intel_sub_group_avc_ime_payload_t = type opaque | ||
| 7487 | diff --git a/clang/test/CodeGenOpenCL/kernels-have-spir-cc-by-default.cl b/clang/test/CodeGenOpenCL/kernels-have-spir-cc-by-default.cl | ||
| 7488 | index e89237623478..3d6708ac361f 100644 | ||
| 7489 | --- a/clang/test/CodeGenOpenCL/kernels-have-spir-cc-by-default.cl | ||
| 7490 | +++ b/clang/test/CodeGenOpenCL/kernels-have-spir-cc-by-default.cl | ||
| 7491 | @@ -1,5 +1,8 @@ | ||
| 7492 | // RUN: %clang_cc1 %s -cl-std=CL1.2 -emit-llvm -triple x86_64-unknown-unknown -o - | FileCheck %s | ||
| 7493 | // RUN: %clang_cc1 %s -cl-std=CL1.2 -emit-llvm -triple amdgcn-unknown-unknown -o - | FileCheck -check-prefixes=AMDGCN %s | ||
| 7494 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 -emit-llvm -triple x86_64-unknown-unknown -o - | FileCheck %s | ||
| 7495 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 -emit-llvm -triple amdgcn-unknown-unknown -o - | FileCheck -check-prefixes=AMDGCN %s | ||
| 7496 | + | ||
| 7497 | // Test that the kernels always use the SPIR calling convention | ||
| 7498 | // to have unambiguous mapping of arguments to feasibly implement | ||
| 7499 | // clSetKernelArg(). | ||
| 7500 | diff --git a/clang/test/CodeGenOpenCL/logical-ops.cl b/clang/test/CodeGenOpenCL/logical-ops.cl | ||
| 7501 | index f083a8580ee7..499eab65039b 100644 | ||
| 7502 | --- a/clang/test/CodeGenOpenCL/logical-ops.cl | ||
| 7503 | +++ b/clang/test/CodeGenOpenCL/logical-ops.cl | ||
| 7504 | @@ -1,4 +1,5 @@ | ||
| 7505 | // RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL1.2 -O1 -triple x86_64-unknown-linux-gnu | FileCheck %s | ||
| 7506 | +// RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 -O1 -triple x86_64-unknown-linux-gnu | FileCheck %s | ||
| 7507 | // RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=clc++ -O1 -triple x86_64-unknown-linux-gnu | FileCheck %s | ||
| 7508 | |||
| 7509 | #pragma OPENCL EXTENSION cl_khr_fp64 : enable | ||
| 7510 | diff --git a/clang/test/CodeGenOpenCL/no-half.cl b/clang/test/CodeGenOpenCL/no-half.cl | ||
| 7511 | index aee8f678f01a..46da7fa339e8 100644 | ||
| 7512 | --- a/clang/test/CodeGenOpenCL/no-half.cl | ||
| 7513 | +++ b/clang/test/CodeGenOpenCL/no-half.cl | ||
| 7514 | @@ -1,6 +1,7 @@ | ||
| 7515 | // RUN: %clang_cc1 %s -cl-std=cl2.0 -emit-llvm -o - -triple spir-unknown-unknown | FileCheck %s | ||
| 7516 | // RUN: %clang_cc1 %s -cl-std=cl1.2 -emit-llvm -o - -triple spir-unknown-unknown | FileCheck %s | ||
| 7517 | // RUN: %clang_cc1 %s -cl-std=cl1.1 -emit-llvm -o - -triple spir-unknown-unknown | FileCheck %s | ||
| 7518 | +// RUN: %clang_cc1 %s -cl-std=cl3.0 -cl-ext=__opencl_c_fp64 -emit-llvm -o - -triple spir-unknown-unknown | FileCheck %s | ||
| 7519 | |||
| 7520 | #pragma OPENCL EXTENSION cl_khr_fp64:enable | ||
| 7521 | |||
| 7522 | diff --git a/clang/test/CodeGenOpenCL/pipe_builtin.cl b/clang/test/CodeGenOpenCL/pipe_builtin.cl | ||
| 7523 | index 02b9669b7ab1..0bf35c336199 100644 | ||
| 7524 | --- a/clang/test/CodeGenOpenCL/pipe_builtin.cl | ||
| 7525 | +++ b/clang/test/CodeGenOpenCL/pipe_builtin.cl | ||
| 7526 | @@ -1,4 +1,7 @@ | ||
| 7527 | // RUN: %clang_cc1 -triple %itanium_abi_triple -emit-llvm -cl-ext=+cl_khr_subgroups -O0 -cl-std=clc++ -o - %s | FileCheck %s | ||
| 7528 | +// RUN: %clang_cc1 -triple %itanium_abi_triple -emit-llvm -cl-ext=+cl_khr_subgroups -O0 -cl-std=cl2.0 -o - %s | FileCheck %s | ||
| 7529 | +// RUN: %clang_cc1 -triple %itanium_abi_triple -emit-llvm -cl-ext=+cl_khr_subgroups -O0 -cl-std=cl3.0 -cl-ext=__opencl_c_pipes,__opencl_c_subgroups -o - %s | FileCheck %s | ||
| 7530 | + | ||
| 7531 | // FIXME: Add MS ABI manglings of OpenCL things and remove %itanium_abi_triple | ||
| 7532 | // above to support OpenCL in the MS C++ ABI. | ||
| 7533 | |||
| 7534 | diff --git a/clang/test/CodeGenOpenCL/pipe_types.cl b/clang/test/CodeGenOpenCL/pipe_types.cl | ||
| 7535 | index ba064c6d7557..b7a523d4f084 100644 | ||
| 7536 | --- a/clang/test/CodeGenOpenCL/pipe_types.cl | ||
| 7537 | +++ b/clang/test/CodeGenOpenCL/pipe_types.cl | ||
| 7538 | @@ -1,4 +1,5 @@ | ||
| 7539 | // RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -emit-llvm -O0 -cl-std=CL2.0 -o - %s | FileCheck %s | ||
| 7540 | +// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -emit-llvm -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -o - %s | FileCheck %s | ||
| 7541 | |||
| 7542 | // CHECK: %opencl.pipe_ro_t = type opaque | ||
| 7543 | // CHECK: %opencl.pipe_wo_t = type opaque | ||
| 7544 | diff --git a/clang/test/CodeGenOpenCL/printf.cl b/clang/test/CodeGenOpenCL/printf.cl | ||
| 7545 | index fc139d776db6..0133c5595d81 100644 | ||
| 7546 | --- a/clang/test/CodeGenOpenCL/printf.cl | ||
| 7547 | +++ b/clang/test/CodeGenOpenCL/printf.cl | ||
| 7548 | @@ -1,5 +1,7 @@ | ||
| 7549 | // RUN: %clang_cc1 -cl-std=CL1.2 -cl-ext=-+cl_khr_fp64 -triple spir-unknown-unknown -disable-llvm-passes -emit-llvm -o - %s | FileCheck -check-prefixes=FP64,ALL %s | ||
| 7550 | // RUN: %clang_cc1 -cl-std=CL1.2 -cl-ext=-cl_khr_fp64 -triple spir-unknown-unknown -disable-llvm-passes -emit-llvm -o - %s | FileCheck -check-prefixes=NOFP64,ALL %s | ||
| 7551 | +// RUN: %clang_cc1 -cl-std=CL3.0 -cl-ext=+__opencl_c_fp64 -triple spir-unknown-unknown -disable-llvm-passes -emit-llvm -o - %s | FileCheck -check-prefixes=FP64,ALL %s | ||
| 7552 | +// RUN: %clang_cc1 -cl-std=CL3.0 -triple spir-unknown-unknown -disable-llvm-passes -emit-llvm -o - %s | FileCheck -check-prefixes=NOFP64,ALL %s | ||
| 7553 | |||
| 7554 | typedef __attribute__((ext_vector_type(2))) float float2; | ||
| 7555 | typedef __attribute__((ext_vector_type(2))) half half2; | ||
| 7556 | diff --git a/clang/test/CodeGenOpenCL/unroll-hint.cl b/clang/test/CodeGenOpenCL/unroll-hint.cl | ||
| 7557 | index 0f84450a1ae6..9347c935869b 100644 | ||
| 7558 | --- a/clang/test/CodeGenOpenCL/unroll-hint.cl | ||
| 7559 | +++ b/clang/test/CodeGenOpenCL/unroll-hint.cl | ||
| 7560 | @@ -1,5 +1,6 @@ | ||
| 7561 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL2.0 -o - %s | FileCheck %s | ||
| 7562 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL1.2 -o - %s | FileCheck %s | ||
| 7563 | +// RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL3.0 -o - %s | FileCheck %s | ||
| 7564 | |||
| 7565 | /*** for ***/ | ||
| 7566 | void for_count() | ||
| 7567 | diff --git a/clang/test/Driver/autocomplete.c b/clang/test/Driver/autocomplete.c | ||
| 7568 | index 5c0bfb69f9a3..eabdf0b5938d 100644 | ||
| 7569 | --- a/clang/test/Driver/autocomplete.c | ||
| 7570 | +++ b/clang/test/Driver/autocomplete.c | ||
| 7571 | @@ -43,6 +43,8 @@ | ||
| 7572 | // CLSTDALL-NEXT: CL1.2 | ||
| 7573 | // CLSTDALL-NEXT: cl2.0 | ||
| 7574 | // CLSTDALL-NEXT: CL2.0 | ||
| 7575 | +// CLSTDALL-NEXT: cl3.0 | ||
| 7576 | +// CLSTDALL-NEXT: CL3.0 | ||
| 7577 | // CLSTDALL-NEXT: clc++ | ||
| 7578 | // CLSTDALL-NEXT: CLC++ | ||
| 7579 | // RUN: %clang --autocomplete=-fno-sanitize-coverage=,f | FileCheck %s -check-prefix=FNOSANICOVER | ||
| 7580 | diff --git a/clang/test/Driver/opencl.cl b/clang/test/Driver/opencl.cl | ||
| 7581 | index 63b04bc1af41..ffdd4f7d65bb 100644 | ||
| 7582 | --- a/clang/test/Driver/opencl.cl | ||
| 7583 | +++ b/clang/test/Driver/opencl.cl | ||
| 7584 | @@ -2,6 +2,7 @@ | ||
| 7585 | // RUN: %clang -S -### -cl-std=CL1.1 %s 2>&1 | FileCheck --check-prefix=CHECK-CL11 %s | ||
| 7586 | // RUN: %clang -S -### -cl-std=CL1.2 %s 2>&1 | FileCheck --check-prefix=CHECK-CL12 %s | ||
| 7587 | // RUN: %clang -S -### -cl-std=CL2.0 %s 2>&1 | FileCheck --check-prefix=CHECK-CL20 %s | ||
| 7588 | +// RUN: %clang -S -### -cl-std=CL3.0 %s 2>&1 | FileCheck --check-prefix=CHECK-CL30 %s | ||
| 7589 | // RUN: %clang -S -### -cl-std=clc++ %s 2>&1 | FileCheck --check-prefix=CHECK-CLCPP %s | ||
| 7590 | // RUN: %clang -S -### -cl-opt-disable %s 2>&1 | FileCheck --check-prefix=CHECK-OPT-DISABLE %s | ||
| 7591 | // RUN: %clang -S -### -cl-strict-aliasing %s 2>&1 | FileCheck --check-prefix=CHECK-STRICT-ALIASING %s | ||
| 7592 | @@ -22,6 +23,7 @@ | ||
| 7593 | // CHECK-CL11: "-cc1" {{.*}} "-cl-std=CL1.1" | ||
| 7594 | // CHECK-CL12: "-cc1" {{.*}} "-cl-std=CL1.2" | ||
| 7595 | // CHECK-CL20: "-cc1" {{.*}} "-cl-std=CL2.0" | ||
| 7596 | +// CHECK-CL30: "-cc1" {{.*}} "-cl-std=CL3.0" | ||
| 7597 | // CHECK-CLCPP: "-cc1" {{.*}} "-cl-std=clc++" | ||
| 7598 | // CHECK-OPT-DISABLE: "-cc1" {{.*}} "-cl-opt-disable" | ||
| 7599 | // CHECK-STRICT-ALIASING: "-cc1" {{.*}} "-cl-strict-aliasing" | ||
| 7600 | diff --git a/clang/test/Driver/unknown-std.cl b/clang/test/Driver/unknown-std.cl | ||
| 7601 | index 6f371bac13ac..00209fb62556 100644 | ||
| 7602 | --- a/clang/test/Driver/unknown-std.cl | ||
| 7603 | +++ b/clang/test/Driver/unknown-std.cl | ||
| 7604 | @@ -10,6 +10,7 @@ | ||
| 7605 | // CHECK-NEXT: note: use 'cl1.1' for 'OpenCL 1.1' standard | ||
| 7606 | // CHECK-NEXT: note: use 'cl1.2' for 'OpenCL 1.2' standard | ||
| 7607 | // CHECK-NEXT: note: use 'cl2.0' for 'OpenCL 2.0' standard | ||
| 7608 | +// CHECK-NEXT: note: use 'cl3.0' for 'OpenCL 3.0' standard | ||
| 7609 | // CHECK-NEXT: note: use 'clc++' for 'C++ for OpenCL' standard | ||
| 7610 | |||
| 7611 | // Make sure that no other output is present. | ||
| 7612 | diff --git a/clang/test/Frontend/stdlang.c b/clang/test/Frontend/stdlang.c | ||
| 7613 | index 51484999e37a..eac4632fbdd6 100644 | ||
| 7614 | --- a/clang/test/Frontend/stdlang.c | ||
| 7615 | +++ b/clang/test/Frontend/stdlang.c | ||
| 7616 | @@ -9,6 +9,7 @@ | ||
| 7617 | // RUN: %clang_cc1 -x cl -cl-std=CL1.1 -DOPENCL %s | ||
| 7618 | // RUN: %clang_cc1 -x cl -cl-std=CL1.2 -DOPENCL %s | ||
| 7619 | // RUN: %clang_cc1 -x cl -cl-std=CL2.0 -DOPENCL %s | ||
| 7620 | +// RUN: %clang_cc1 -x cl -cl-std=CL3.0 -DOPENCL %s | ||
| 7621 | // RUN: %clang_cc1 -x cl -cl-std=CLC++ -DOPENCL %s | ||
| 7622 | // RUN: not %clang_cc1 -x cl -std=c99 -DOPENCL %s 2>&1 | FileCheck --check-prefix=CHECK-C99 %s | ||
| 7623 | // RUN: not %clang_cc1 -x cl -cl-std=invalid -DOPENCL %s 2>&1 | FileCheck --check-prefix=CHECK-INVALID %s | ||
| 7624 | diff --git a/clang/test/Headers/opencl-c-header.cl b/clang/test/Headers/opencl-c-header.cl | ||
| 7625 | index 1b151ffdd16a..2716076acdcf 100644 | ||
| 7626 | --- a/clang/test/Headers/opencl-c-header.cl | ||
| 7627 | +++ b/clang/test/Headers/opencl-c-header.cl | ||
| 7628 | @@ -1,6 +1,7 @@ | ||
| 7629 | // RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify | FileCheck %s | ||
| 7630 | // RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify -cl-std=CL1.1 | FileCheck %s | ||
| 7631 | // RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify -cl-std=CL1.2 | FileCheck %s | ||
| 7632 | +// RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify -cl-std=CL3.0 | FileCheck %s | ||
| 7633 | // RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify -cl-std=clc++ | FileCheck %s --check-prefix=CHECK20 | ||
| 7634 | |||
| 7635 | // Test including the default header as a module. | ||
| 7636 | @@ -39,9 +40,11 @@ | ||
| 7637 | // RUN: rm -rf %t | ||
| 7638 | // RUN: mkdir -p %t | ||
| 7639 | // RUN: %clang_cc1 -triple spir64-unknown-unknown -emit-llvm -o - -cl-std=CL1.2 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK --check-prefix=CHECK-MOD %s | ||
| 7640 | +// RUN: %clang_cc1 -triple spir64-unknown-unknown -emit-llvm -o - -cl-std=CL3.0 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK --check-prefix=CHECK-MOD %s | ||
| 7641 | // RUN: %clang_cc1 -triple amdgcn--amdhsa -O0 -emit-llvm -o - -cl-std=CL2.0 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK20 --check-prefix=CHECK-MOD %s | ||
| 7642 | // RUN: chmod u-w %t | ||
| 7643 | // RUN: %clang_cc1 -triple spir64-unknown-unknown -emit-llvm -o - -cl-std=CL1.2 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK --check-prefix=CHECK-MOD %s | ||
| 7644 | +// RUN: %clang_cc1 -triple spir64-unknown-unknown -emit-llvm -o - -cl-std=CL3.0 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK --check-prefix=CHECK-MOD %s | ||
| 7645 | // RUN: %clang_cc1 -triple amdgcn--amdhsa -O0 -emit-llvm -o - -cl-std=CL2.0 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK20 --check-prefix=CHECK-MOD %s | ||
| 7646 | // RUN: chmod u+w %t | ||
| 7647 | |||
| 7648 | @@ -67,7 +70,7 @@ char f(char x) { | ||
| 7649 | // from OpenCL 2.0 onwards. | ||
| 7650 | |||
| 7651 | // CHECK20: _Z12write_imagef14ocl_image3d_wo | ||
| 7652 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 7653 | +#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 7654 | void test_image3dwo(write_only image3d_t img) { | ||
| 7655 | write_imagef(img, (0), (0.0f)); | ||
| 7656 | } | ||
| 7657 | @@ -81,7 +84,7 @@ void test_atomics(__generic volatile unsigned int* a) { | ||
| 7658 | #endif | ||
| 7659 | |||
| 7660 | // Verify that ATOMIC_VAR_INIT is defined. | ||
| 7661 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 7662 | +#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 7663 | global atomic_int z = ATOMIC_VAR_INIT(99); | ||
| 7664 | #endif //__OPENCL_C_VERSION__ | ||
| 7665 | |||
| 7666 | diff --git a/clang/test/Index/pipe-size.cl b/clang/test/Index/pipe-size.cl | ||
| 7667 | index 94a1255f0a48..59b76051eda1 100644 | ||
| 7668 | --- a/clang/test/Index/pipe-size.cl | ||
| 7669 | +++ b/clang/test/Index/pipe-size.cl | ||
| 7670 | @@ -2,6 +2,13 @@ | ||
| 7671 | // RUN: %clang_cc1 -x cl -O0 -cl-std=CL2.0 -emit-llvm -triple spir-unknown-unknown %s -o - | FileCheck %s --check-prefix=SPIR | ||
| 7672 | // RUN: %clang_cc1 -x cl -O0 -cl-std=CL2.0 -emit-llvm -triple spir64-unknown-unknown %s -o - | FileCheck %s --check-prefix=SPIR64 | ||
| 7673 | // RUN: %clang_cc1 -x cl -O0 -cl-std=CL2.0 -emit-llvm -triple amdgcn-amd-amdhsa %s -o - | FileCheck %s --check-prefix=AMDGCN | ||
| 7674 | +// RUN: %clang_cc1 -x cl -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -emit-llvm -triple x86_64-unknown-linux-gnu %s -o - | FileCheck %s --check-prefix=X86 | ||
| 7675 | +// RUN: %clang_cc1 -x cl -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -emit-llvm -triple spir-unknown-unknown %s -o - | FileCheck %s --check-prefix=SPIR | ||
| 7676 | +// RUN: %clang_cc1 -x cl -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -emit-llvm -triple spir64-unknown-unknown %s -o - | FileCheck %s --check-prefix=SPIR64 | ||
| 7677 | +// RUN: %clang_cc1 -x cl -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -emit-llvm -triple amdgcn-amd-amdhsa %s -o - | FileCheck %s --check-prefix=AMDGCN | ||
| 7678 | + | ||
| 7679 | + | ||
| 7680 | + | ||
| 7681 | __kernel void testPipe( pipe int test ) | ||
| 7682 | { | ||
| 7683 | int s = sizeof(test); | ||
| 7684 | diff --git a/clang/test/Preprocessor/predefined-macros.c b/clang/test/Preprocessor/predefined-macros.c | ||
| 7685 | index def105f4c52e..b088a37ba665 100644 | ||
| 7686 | --- a/clang/test/Preprocessor/predefined-macros.c | ||
| 7687 | +++ b/clang/test/Preprocessor/predefined-macros.c | ||
| 7688 | @@ -129,6 +129,8 @@ | ||
| 7689 | // RUN: | FileCheck -match-full-lines %s --check-prefix=CHECK-CL12 | ||
| 7690 | // RUN: %clang_cc1 %s -E -dM -o - -x cl -cl-std=CL2.0 \ | ||
| 7691 | // RUN: | FileCheck -match-full-lines %s --check-prefix=CHECK-CL20 | ||
| 7692 | +// RUN: %clang_cc1 %s -E -dM -o - -x cl -cl-std=CL3.0 \ | ||
| 7693 | +// RUN: | FileCheck -match-full-lines %s --check-prefix=CHECK-CL30 | ||
| 7694 | // RUN: %clang_cc1 %s -E -dM -o - -x cl -cl-fast-relaxed-math \ | ||
| 7695 | // RUN: | FileCheck -match-full-lines %s --check-prefix=CHECK-FRM | ||
| 7696 | // RUN: %clang_cc1 %s -E -dM -o - -x cl -cl-std=clc++ \ | ||
| 7697 | @@ -137,26 +139,37 @@ | ||
| 7698 | // CHECK-CL10: #define CL_VERSION_1_1 110 | ||
| 7699 | // CHECK-CL10: #define CL_VERSION_1_2 120 | ||
| 7700 | // CHECK-CL10: #define CL_VERSION_2_0 200 | ||
| 7701 | +// CHECK-CL10: #define CL_VERSION_3_0 300 | ||
| 7702 | // CHECK-CL10: #define __OPENCL_C_VERSION__ 100 | ||
| 7703 | // CHECK-CL10-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7704 | // CHECK-CL11: #define CL_VERSION_1_0 100 | ||
| 7705 | // CHECK-CL11: #define CL_VERSION_1_1 110 | ||
| 7706 | // CHECK-CL11: #define CL_VERSION_1_2 120 | ||
| 7707 | // CHECK-CL11: #define CL_VERSION_2_0 200 | ||
| 7708 | +// CHECK-CL11: #define CL_VERSION_3_0 300 | ||
| 7709 | // CHECK-CL11: #define __OPENCL_C_VERSION__ 110 | ||
| 7710 | // CHECK-CL11-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7711 | // CHECK-CL12: #define CL_VERSION_1_0 100 | ||
| 7712 | // CHECK-CL12: #define CL_VERSION_1_1 110 | ||
| 7713 | // CHECK-CL12: #define CL_VERSION_1_2 120 | ||
| 7714 | // CHECK-CL12: #define CL_VERSION_2_0 200 | ||
| 7715 | +// CHECK-CL12: #define CL_VERSION_3_0 300 | ||
| 7716 | // CHECK-CL12: #define __OPENCL_C_VERSION__ 120 | ||
| 7717 | // CHECK-CL12-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7718 | // CHECK-CL20: #define CL_VERSION_1_0 100 | ||
| 7719 | // CHECK-CL20: #define CL_VERSION_1_1 110 | ||
| 7720 | // CHECK-CL20: #define CL_VERSION_1_2 120 | ||
| 7721 | // CHECK-CL20: #define CL_VERSION_2_0 200 | ||
| 7722 | +// CHECK-CL20: #define CL_VERSION_3_0 300 | ||
| 7723 | // CHECK-CL20: #define __OPENCL_C_VERSION__ 200 | ||
| 7724 | // CHECK-CL20-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7725 | +// CHECK-CL30: #define CL_VERSION_1_0 100 | ||
| 7726 | +// CHECK-CL30: #define CL_VERSION_1_1 110 | ||
| 7727 | +// CHECK-CL30: #define CL_VERSION_1_2 120 | ||
| 7728 | +// CHECK-CL30: #define CL_VERSION_2_0 200 | ||
| 7729 | +// CHECK-CL30: #define CL_VERSION_3_0 300 | ||
| 7730 | +// CHECK-CL30: #define __OPENCL_C_VERSION__ 300 | ||
| 7731 | +// CHECK-CL30-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7732 | // CHECK-FRM: #define __FAST_RELAXED_MATH__ 1 | ||
| 7733 | // CHECK-CLCPP10: #define __CL_CPP_VERSION_1_0__ 100 | ||
| 7734 | // CHECK-CLCPP10: #define __OPENCL_CPP_VERSION__ 100 | ||
| 7735 | diff --git a/clang/test/Sema/feature-extensions-simult-support.cl b/clang/test/Sema/feature-extensions-simult-support.cl | ||
| 7736 | new file mode 100644 | ||
| 7737 | index 000000000000..0789105002b2 | ||
| 7738 | --- /dev/null | ||
| 7739 | +++ b/clang/test/Sema/feature-extensions-simult-support.cl | ||
| 7740 | @@ -0,0 +1,75 @@ | ||
| 7741 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=-cl_khr_fp64 | ||
| 7742 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=+cl_khr_fp64 | ||
| 7743 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=-cl_khr_3d_image_writes | ||
| 7744 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=+cl_khr_3d_image_writes | ||
| 7745 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=-cl_khr_subgroups | ||
| 7746 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=+cl_khr_subgroups | ||
| 7747 | + | ||
| 7748 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=-cl_khr_fp64 | ||
| 7749 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=+cl_khr_fp64 | ||
| 7750 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=-cl_khr_3d_image_writes | ||
| 7751 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=+cl_khr_3d_image_writes | ||
| 7752 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=-cl_khr_subgroups | ||
| 7753 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=+cl_khr_subgroups | ||
| 7754 | + | ||
| 7755 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_fp64 | ||
| 7756 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_3d_image_writes | ||
| 7757 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_subgroups | ||
| 7758 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_pipes | ||
| 7759 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_device_enqueue | ||
| 7760 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_read_write_images | ||
| 7761 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_fp64,-cl_khr_fp64 | ||
| 7762 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_3d_image_writes,-cl_khr_3d_image_writes | ||
| 7763 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_subgroups,-cl_khr_subgroups | ||
| 7764 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+cl_khr_fp64 | ||
| 7765 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+cl_khr_3d_image_writes | ||
| 7766 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+cl_khr_subgroups | ||
| 7767 | + | ||
| 7768 | +// expected-no-diagnostics | ||
| 7769 | + | ||
| 7770 | +#ifdef cl_khr_fp64 | ||
| 7771 | + #ifndef __opencl_c_fp64 | ||
| 7772 | + #error macros were not properly set up | ||
| 7773 | + #endif | ||
| 7774 | +#endif | ||
| 7775 | +#ifdef __opencl_c_fp64 | ||
| 7776 | + #ifndef cl_khr_fp64 | ||
| 7777 | + #error macros were not properly set up | ||
| 7778 | + #endif | ||
| 7779 | +#endif | ||
| 7780 | + | ||
| 7781 | +#ifdef cl_khr_3d_image_writes | ||
| 7782 | + #ifndef __opencl_c_3d_image_writes | ||
| 7783 | + #error macros were not properly set up | ||
| 7784 | + #endif | ||
| 7785 | +#endif | ||
| 7786 | +#ifdef __opencl_c_3d_image_writes | ||
| 7787 | + #ifndef cl_khr_3d_image_writes | ||
| 7788 | + #error macros were not properly set up | ||
| 7789 | + #endif | ||
| 7790 | +#endif | ||
| 7791 | + | ||
| 7792 | +#ifdef cl_khr_subgroups | ||
| 7793 | + #ifndef __opencl_c_subgroups | ||
| 7794 | + #error macros were not properly set up | ||
| 7795 | + #endif | ||
| 7796 | +#endif | ||
| 7797 | +#ifdef __opencl_c_subgroups | ||
| 7798 | + #ifndef cl_khr_subgroups | ||
| 7799 | + #error macros were not properly set up | ||
| 7800 | + #endif | ||
| 7801 | +#endif | ||
| 7802 | + | ||
| 7803 | +#if defined(__opencl_c_pipes) || defined(__opencl_c_device_enqueue) | ||
| 7804 | + #ifndef __opencl_c_generic_address_space | ||
| 7805 | + #error macros were not properly set up | ||
| 7806 | + #endif | ||
| 7807 | +#endif | ||
| 7808 | + | ||
| 7809 | +#if defined(__opencl_c_3d_image_writes) || defined(__opencl_c_read_write_images) | ||
| 7810 | + #ifndef __opencl_c_images | ||
| 7811 | + #error macros were not properly set up | ||
| 7812 | + #endif | ||
| 7813 | +#endif | ||
| 7814 | + | ||
| 7815 | +kernel void test(){} | ||
| 7816 | diff --git a/clang/test/Sema/features-ignore-pragma.cl b/clang/test/Sema/features-ignore-pragma.cl | ||
| 7817 | new file mode 100644 | ||
| 7818 | index 000000000000..046ce5390754 | ||
| 7819 | --- /dev/null | ||
| 7820 | +++ b/clang/test/Sema/features-ignore-pragma.cl | ||
| 7821 | @@ -0,0 +1,24 @@ | ||
| 7822 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 | ||
| 7823 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 | ||
| 7824 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_subgroups | ||
| 7825 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_3d_image_writes | ||
| 7826 | + | ||
| 7827 | +#pragma OPENCL EXTENSION __opencl_c_fp64 : enable | ||
| 7828 | +// expected-warning@-1 {{OpenCL feature support can't be controlled via pragma, ignoring}} | ||
| 7829 | + | ||
| 7830 | +#pragma OPENCL EXTENSION cl_khr_fp64 : enable | ||
| 7831 | +#ifndef __opencl_c_fp64 | ||
| 7832 | +// expected-warning@-2{{unsupported OpenCL extension 'cl_khr_fp64' - ignoring}} | ||
| 7833 | +#endif | ||
| 7834 | + | ||
| 7835 | +#pragma OPENCL EXTENSION cl_khr_subgroups : enable | ||
| 7836 | +#ifndef __opencl_c_subgroups | ||
| 7837 | +// expected-warning@-2{{unsupported OpenCL extension 'cl_khr_subgroups' - ignoring}} | ||
| 7838 | +#endif | ||
| 7839 | + | ||
| 7840 | +#pragma OPENCL EXTENSION cl_khr_3d_image_writes : enable | ||
| 7841 | +#ifndef __opencl_c_3d_image_writes | ||
| 7842 | +// expected-warning@-2{{unsupported OpenCL extension 'cl_khr_3d_image_writes' - ignoring}} | ||
| 7843 | +#endif | ||
| 7844 | + | ||
| 7845 | +kernel void foo() {} | ||
| 7846 | diff --git a/clang/test/Sema/opencl-features-pipes.cl b/clang/test/Sema/opencl-features-pipes.cl | ||
| 7847 | new file mode 100644 | ||
| 7848 | index 000000000000..c0ac778f24a6 | ||
| 7849 | --- /dev/null | ||
| 7850 | +++ b/clang/test/Sema/opencl-features-pipes.cl | ||
| 7851 | @@ -0,0 +1,18 @@ | ||
| 7852 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.1 | ||
| 7853 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 | ||
| 7854 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -DHAS | ||
| 7855 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 | ||
| 7856 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -DHAS | ||
| 7857 | +// expected-no-diagnostics | ||
| 7858 | + | ||
| 7859 | +#ifdef HAS | ||
| 7860 | + #ifndef __opencl_c_pipes | ||
| 7861 | + #error Feature should be defined | ||
| 7862 | + #endif | ||
| 7863 | +#else | ||
| 7864 | + #ifdef __opencl_c_pipes | ||
| 7865 | + #error Feature should not be defined | ||
| 7866 | + #endif | ||
| 7867 | +#endif | ||
| 7868 | + | ||
| 7869 | +kernel void foo() {} | ||
| 7870 | diff --git a/clang/test/Sema/opencl-features.cl b/clang/test/Sema/opencl-features.cl | ||
| 7871 | new file mode 100644 | ||
| 7872 | index 000000000000..aa432f6b60bf | ||
| 7873 | --- /dev/null | ||
| 7874 | +++ b/clang/test/Sema/opencl-features.cl | ||
| 7875 | @@ -0,0 +1,128 @@ | ||
| 7876 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 | ||
| 7877 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=-__opencl_c_device_enqueue,-__opencl_c_pipes,-__opencl_c_read_write_images | ||
| 7878 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CLC++ | ||
| 7879 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 | ||
| 7880 | +// expected-no-diagnostics | ||
| 7881 | + | ||
| 7882 | +#ifndef __opencl_c_int64 | ||
| 7883 | + #error Feature __opencl_c_int64 shouldn't be defined | ||
| 7884 | +#endif | ||
| 7885 | + | ||
| 7886 | +#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 7887 | + #ifndef __opencl_c_3d_image_writes | ||
| 7888 | + #error Feature __opencl_c_3d_image_writes should be defined | ||
| 7889 | + #endif | ||
| 7890 | + | ||
| 7891 | + #ifndef __opencl_c_atomic_order_acq_rel | ||
| 7892 | + #error Feature __opencl_c_atomic_order_acq_rel should be defined | ||
| 7893 | + #endif | ||
| 7894 | + | ||
| 7895 | + #ifndef __opencl_c_atomic_order_seq_cst | ||
| 7896 | + #error Feature __opencl_c_atomic_order_seq_cst should be defined | ||
| 7897 | + #endif | ||
| 7898 | + | ||
| 7899 | + #ifndef __opencl_c_atomic_scope_device | ||
| 7900 | + #error Feature __opencl_c_atomic_scope_device should be defined | ||
| 7901 | + #endif | ||
| 7902 | + | ||
| 7903 | + #ifndef __opencl_c_atomic_scope_all_devices | ||
| 7904 | + #error Feature __opencl_c_atomic_scope_all_devices should be defined | ||
| 7905 | + #endif | ||
| 7906 | + | ||
| 7907 | + #ifndef __opencl_c_device_enqueue | ||
| 7908 | + #error Feature __opencl_c_device_enqueue should be defined | ||
| 7909 | + #endif | ||
| 7910 | + | ||
| 7911 | + #ifndef __opencl_c_generic_address_space | ||
| 7912 | + #error Feature __opencl_c_generic_address_space should be defined | ||
| 7913 | + #endif | ||
| 7914 | + | ||
| 7915 | + #ifndef __opencl_c_pipes | ||
| 7916 | + #error Feature __opencl_c_pipes should be defined | ||
| 7917 | + #endif | ||
| 7918 | + | ||
| 7919 | + #ifndef __opencl_c_program_scope_global_variables | ||
| 7920 | + #error Feature __opencl_c_program_scope_global_variables should be defined | ||
| 7921 | + #endif | ||
| 7922 | + | ||
| 7923 | + #ifndef __opencl_c_read_write_images | ||
| 7924 | + #error Feature __opencl_c_read_write_images should be defined | ||
| 7925 | + #endif | ||
| 7926 | + | ||
| 7927 | + #ifndef __opencl_c_subgroups | ||
| 7928 | + #error Feature __opencl_c_subgroups should be defined | ||
| 7929 | + #endif | ||
| 7930 | + | ||
| 7931 | + #ifndef __opencl_c_work_group_collective_functions | ||
| 7932 | + #error Feature __opencl_c_work_group_collective_functions should be defined | ||
| 7933 | + #endif | ||
| 7934 | + | ||
| 7935 | + #ifndef __opencl_c_fp64 | ||
| 7936 | + #error Feature __opencl_c_fp64 should be defined | ||
| 7937 | + #endif | ||
| 7938 | + | ||
| 7939 | + #ifndef __opencl_c_images | ||
| 7940 | + #error Feature __opencl_c_images should be defined | ||
| 7941 | + #endif | ||
| 7942 | +#endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 7943 | + | ||
| 7944 | + | ||
| 7945 | +#if __OPENCL_C_VERSION__ == CL_VERSION_3_0 | ||
| 7946 | + #ifdef __opencl_c_3d_image_writes | ||
| 7947 | + #error Feature __opencl_c_3d_image_writes shouldn't be defined | ||
| 7948 | + #endif | ||
| 7949 | + | ||
| 7950 | + #ifdef __opencl_c_atomic_order_acq_rel | ||
| 7951 | + #error Feature __opencl_c_atomic_order_acq_rel shouldn't be defined | ||
| 7952 | + #endif | ||
| 7953 | + | ||
| 7954 | + #ifdef __opencl_c_atomic_order_seq_cst | ||
| 7955 | + #error Feature __opencl_c_atomic_order_seq_cst shouldn't be defined | ||
| 7956 | + #endif | ||
| 7957 | + | ||
| 7958 | + #ifdef __opencl_c_atomic_scope_device | ||
| 7959 | + #error Feature __opencl_c_atomic_scope_device shouldn't be defined | ||
| 7960 | + #endif | ||
| 7961 | + | ||
| 7962 | + #ifdef __opencl_c_atomic_scope_all_devices | ||
| 7963 | + #error Feature __opencl_c_atomic_scope_all_devices shouldn't be defined | ||
| 7964 | + #endif | ||
| 7965 | + | ||
| 7966 | + #ifdef __opencl_c_device_enqueue | ||
| 7967 | + #error Feature __opencl_c_device_enqueue shouldn't be defined | ||
| 7968 | + #endif | ||
| 7969 | + | ||
| 7970 | + #ifdef __opencl_c_generic_address_space | ||
| 7971 | + #error Feature __opencl_c_generic_address_space shouldn't be defined | ||
| 7972 | + #endif | ||
| 7973 | + | ||
| 7974 | + #ifdef __opencl_c_pipes | ||
| 7975 | + #error Feature __opencl_c_pipes shouldn't be defined | ||
| 7976 | + #endif | ||
| 7977 | + | ||
| 7978 | + #ifdef __opencl_c_program_scope_global_variables | ||
| 7979 | + #error Feature __opencl_c_program_scope_global_variables shouldn't be defined | ||
| 7980 | + #endif | ||
| 7981 | + | ||
| 7982 | + #ifdef __opencl_c_read_write_images | ||
| 7983 | + #error Feature __opencl_c_read_write_images shouldn't be defined | ||
| 7984 | + #endif | ||
| 7985 | + | ||
| 7986 | + #ifdef __opencl_c_subgroups | ||
| 7987 | + #error Feature __opencl_c_subgroups shouldn't be defined | ||
| 7988 | + #endif | ||
| 7989 | + | ||
| 7990 | + #ifdef __opencl_c_work_group_collective_functions | ||
| 7991 | + #error Feature __opencl_c_work_group_collective_functions shouldn't be defined | ||
| 7992 | + #endif | ||
| 7993 | + | ||
| 7994 | + #ifdef __opencl_c_fp64 | ||
| 7995 | + #error Feature __opencl_c_fp64 shouldn't be defined | ||
| 7996 | + #endif | ||
| 7997 | + | ||
| 7998 | + #ifdef __opencl_c_images | ||
| 7999 | + #error Feature __opencl_c_images shouldn't be defined | ||
| 8000 | + #endif | ||
| 8001 | +#endif // __OPENCL_C_VERSION__ == CL_VERSION_3_0 | ||
| 8002 | + | ||
| 8003 | +kernel void foo() {} | ||
| 8004 | diff --git a/clang/test/Sema/pipe_builtins_feature.cl b/clang/test/Sema/pipe_builtins_feature.cl | ||
| 8005 | new file mode 100644 | ||
| 8006 | index 000000000000..56fa94fc7705 | ||
| 8007 | --- /dev/null | ||
| 8008 | +++ b/clang/test/Sema/pipe_builtins_feature.cl | ||
| 8009 | @@ -0,0 +1,21 @@ | ||
| 8010 | +// RUN: %clang_cc1 -cl-std=CL2.0 -fsyntax-only -verify %s | ||
| 8011 | +// RUN: %clang_cc1 -cl-std=CL3.0 -fsyntax-only -verify %s | ||
| 8012 | +// RUN: %clang_cc1 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -fsyntax-only -verify %s | ||
| 8013 | + | ||
| 8014 | +#ifdef __opencl_c_pipes | ||
| 8015 | + #ifndef __opencl_c_generic_address_space | ||
| 8016 | + #error Generic address space feature must also be defined | ||
| 8017 | + #endif | ||
| 8018 | +// CHECK: expected-no-diagnostics | ||
| 8019 | +// check that pragma disable all doesn't touch feature support | ||
| 8020 | + #pragma OPENCL EXTENSION all : disable | ||
| 8021 | +#endif | ||
| 8022 | + | ||
| 8023 | +void test(read_only pipe int p, global int *ptr) { | ||
| 8024 | + reserve_id_t rid; | ||
| 8025 | +} | ||
| 8026 | + | ||
| 8027 | +#ifndef __opencl_c_pipes | ||
| 8028 | +// expected-error@-5 {{expected parameter declarator}} expected-error@-5 {{expected ')'}} expected-note@-5 {{to match this '('}} | ||
| 8029 | +// expected-error@-5 {{use of type 'reserve_id_t' requires __opencl_c_pipes extension to be enabled}} | ||
| 8030 | +#endif | ||
| 8031 | diff --git a/clang/test/SemaOpenCL/address-spaces-conversions-cl2.0.cl b/clang/test/SemaOpenCL/address-spaces-conversions-cl2.0.cl | ||
| 8032 | index 5efea216346a..09aea27ae6de 100644 | ||
| 8033 | --- a/clang/test/SemaOpenCL/address-spaces-conversions-cl2.0.cl | ||
| 8034 | +++ b/clang/test/SemaOpenCL/address-spaces-conversions-cl2.0.cl | ||
| 8035 | @@ -1,6 +1,9 @@ | ||
| 8036 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DCONSTANT -cl-std=CL2.0 | ||
| 8037 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGLOBAL -cl-std=CL2.0 | ||
| 8038 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGENERIC -cl-std=CL2.0 | ||
| 8039 | +// RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DCONSTANT -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space | ||
| 8040 | +// RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGLOBAL -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space | ||
| 8041 | +// RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGENERIC -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space | ||
| 8042 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DCONSTANT -cl-std=clc++ | ||
| 8043 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGLOBAL -cl-std=clc++ | ||
| 8044 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGENERIC -cl-std=clc++ | ||
| 8045 | diff --git a/clang/test/SemaOpenCL/address-spaces.cl b/clang/test/SemaOpenCL/address-spaces.cl | ||
| 8046 | index 07547ea19680..e367a7c57292 100644 | ||
| 8047 | --- a/clang/test/SemaOpenCL/address-spaces.cl | ||
| 8048 | +++ b/clang/test/SemaOpenCL/address-spaces.cl | ||
| 8049 | @@ -1,5 +1,6 @@ | ||
| 8050 | // RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only | ||
| 8051 | // RUN: %clang_cc1 %s -cl-std=CL2.0 -verify -pedantic -fsyntax-only | ||
| 8052 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space -verify -pedantic -fsyntax-only | ||
| 8053 | // RUN: %clang_cc1 %s -cl-std=clc++ -verify -pedantic -fsyntax-only | ||
| 8054 | |||
| 8055 | __constant int ci = 1; | ||
| 8056 | diff --git a/clang/test/SemaOpenCL/cl20-device-side-enqueue.cl b/clang/test/SemaOpenCL/cl20-device-side-enqueue.cl | ||
| 8057 | index f63e2913c749..727141190a0b 100644 | ||
| 8058 | --- a/clang/test/SemaOpenCL/cl20-device-side-enqueue.cl | ||
| 8059 | +++ b/clang/test/SemaOpenCL/cl20-device-side-enqueue.cl | ||
| 8060 | @@ -2,6 +2,12 @@ | ||
| 8061 | // RUN: %clang_cc1 %s -cl-std=CL2.0 -triple "spir-unknown-unknown" -verify -pedantic -fsyntax-only -DB32 -DQUALS="const volatile" | ||
| 8062 | // RUN: %clang_cc1 %s -cl-std=CL2.0 -triple "spir64-unknown-unknown" -verify -pedantic -fsyntax-only -Wconversion -DWCONV -DQUALS= | ||
| 8063 | // RUN: %clang_cc1 %s -cl-std=CL2.0 -triple "spir64-unknown-unknown" -verify -pedantic -fsyntax-only -Wconversion -DWCONV -DQUALS="const volatile" | ||
| 8064 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -triple "spir-unknown-unknown" -cl-ext=__opencl_c_device_enqueue,__opencl_c_subgroups -verify -pedantic -fsyntax-only -DB32 -DQUALS= | ||
| 8065 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -triple "spir-unknown-unknown" -cl-ext=__opencl_c_device_enqueue,__opencl_c_subgroups -verify -pedantic -fsyntax-only -DB32 -DQUALS="const volatile" | ||
| 8066 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -triple "spir64-unknown-unknown" -cl-ext=__opencl_c_device_enqueue,__opencl_c_subgroups -verify -pedantic -fsyntax-only -Wconversion -DWCONV -DQUALS= | ||
| 8067 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -triple "spir64-unknown-unknown" -cl-ext=__opencl_c_device_enqueue,__opencl_c_subgroups -verify -pedantic -fsyntax-only -Wconversion -DWCONV -DQUALS="const volatile" | ||
| 8068 | + | ||
| 8069 | + | ||
| 8070 | |||
| 8071 | typedef struct {int a;} ndrange_t; | ||
| 8072 | // Diagnostic tests for different overloads of enqueue_kernel from Table 6.13.17.1 of OpenCL 2.0 Spec. | ||
| 8073 | @@ -235,11 +241,17 @@ kernel void bar(global unsigned int *buf) | ||
| 8074 | kernel void foo1(global unsigned int *buf) | ||
| 8075 | { | ||
| 8076 | ndrange_t n; | ||
| 8077 | - buf[0] = get_kernel_max_sub_group_size_for_ndrange(n, ^(){}); // expected-error {{use of declaration 'get_kernel_max_sub_group_size_for_ndrange' requires cl_khr_subgroups extension to be enabled}} | ||
| 8078 | + buf[0] = get_kernel_max_sub_group_size_for_ndrange(n, ^(){}); | ||
| 8079 | +#if __OPENCL_C_VERSION__ < 300 | ||
| 8080 | +// expected-error@-2 {{use of declaration 'get_kernel_max_sub_group_size_for_ndrange' requires cl_khr_subgroups extension to be enabled}} | ||
| 8081 | +#endif | ||
| 8082 | } | ||
| 8083 | |||
| 8084 | kernel void bar1(global unsigned int *buf) | ||
| 8085 | { | ||
| 8086 | ndrange_t n; | ||
| 8087 | - buf[0] = get_kernel_sub_group_count_for_ndrange(n, ^(){}); // expected-error {{use of declaration 'get_kernel_sub_group_count_for_ndrange' requires cl_khr_subgroups extension to be enabled}} | ||
| 8088 | + buf[0] = get_kernel_sub_group_count_for_ndrange(n, ^(){}); | ||
| 8089 | +#if __OPENCL_C_VERSION__ < 300 | ||
| 8090 | +// expected-error@-2 {{use of declaration 'get_kernel_sub_group_count_for_ndrange' requires cl_khr_subgroups extension to be enabled}} | ||
| 8091 | +#endif | ||
| 8092 | } | ||
| 8093 | diff --git a/clang/test/SemaOpenCL/forget-unsupported-builtins.cl b/clang/test/SemaOpenCL/forget-unsupported-builtins.cl | ||
| 8094 | new file mode 100644 | ||
| 8095 | index 000000000000..14dd03e2c7db | ||
| 8096 | --- /dev/null | ||
| 8097 | +++ b/clang/test/SemaOpenCL/forget-unsupported-builtins.cl | ||
| 8098 | @@ -0,0 +1,22 @@ | ||
| 8099 | +// RUN: %clang_cc1 -cl-std=cl3.0 -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8100 | +// RUN: %clang_cc1 -cl-std=cl3.0 -fsyntax-only -cl-ext=__opencl_c_pipes,__opencl_c_generic_address_space,__opencl_c_device_enqueue -verify %s -triple spir-unknown-unknown -DFEATURES | ||
| 8101 | + | ||
| 8102 | +#ifndef FEATURES | ||
| 8103 | + // expected-no-diagnostics | ||
| 8104 | +#else | ||
| 8105 | + // expected-error@+10 {{cannot redeclare builtin function 'get_pipe_max_packets'}} | ||
| 8106 | + // expected-note@+9 {{'get_pipe_max_packets' is a builtin with type 'unsigned int ()'}} | ||
| 8107 | + // expected-error@+9 {{cannot redeclare builtin function 'to_local'}} | ||
| 8108 | + // expected-note@+8 {{'to_local' is a builtin with type 'void *(void *)'}} | ||
| 8109 | + // expected-error@+8 {{cannot redeclare builtin function 'to_global'}} | ||
| 8110 | + // expected-note@+7 {{'to_global' is a builtin with type 'void *(void *)'}} | ||
| 8111 | + // expected-error@+7 {{cannot redeclare builtin function 'get_kernel_work_group_size'}} | ||
| 8112 | + // expected-note@+6 {{'get_kernel_work_group_size' is a builtin with type 'unsigned int ()'}} | ||
| 8113 | +#endif | ||
| 8114 | + | ||
| 8115 | +int get_pipe_max_packets(int); | ||
| 8116 | +int to_local(int); | ||
| 8117 | +int to_global(int); | ||
| 8118 | +int get_kernel_work_group_size(int); | ||
| 8119 | + | ||
| 8120 | +kernel void test(global int *dst) {} | ||
| 8121 | diff --git a/clang/test/SemaOpenCL/image-features.cl b/clang/test/SemaOpenCL/image-features.cl | ||
| 8122 | new file mode 100644 | ||
| 8123 | index 000000000000..ace6913bb31e | ||
| 8124 | --- /dev/null | ||
| 8125 | +++ b/clang/test/SemaOpenCL/image-features.cl | ||
| 8126 | @@ -0,0 +1,20 @@ | ||
| 8127 | +// RUN: %clang_cc1 -cl-std=cl2.0 -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8128 | +// RUN: %clang_cc1 -cl-std=cl3.0 -cl-ext=__opencl_c_images -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8129 | +// RUN: %clang_cc1 -cl-std=cl3.0 -cl-ext=__opencl_c_3d_image_writes -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8130 | +// RUN: %clang_cc1 -cl-std=cl3.0 -cl-ext=__opencl_c_read_write_images -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8131 | + | ||
| 8132 | +#if defined(__opencl_c_read_write_images) && defined(__opencl_c_3d_image_writes) | ||
| 8133 | + // expected-no-diagnostics | ||
| 8134 | +#endif | ||
| 8135 | + | ||
| 8136 | +__kernel void write_3d_image(__write_only image3d_t i) {} | ||
| 8137 | + | ||
| 8138 | +#ifndef __opencl_c_3d_image_writes | ||
| 8139 | + // expected-error@-3 {{use of type '__write_only image3d_t' requires __opencl_c_3d_image_writes extension to be enabled}} | ||
| 8140 | +#endif | ||
| 8141 | + | ||
| 8142 | +__kernel void read_write_3d_image(__read_write image3d_t i) { } | ||
| 8143 | + | ||
| 8144 | +#ifndef __opencl_c_read_write_images | ||
| 8145 | + // expected-error@-3 {{use of type '__read_write image3d_t' requires __opencl_c_read_write_images extension to be enabled}} | ||
| 8146 | +#endif | ||
| 8147 | diff --git a/clang/test/SemaOpenCL/invalid-pipe-builtin-cl2.0.cl b/clang/test/SemaOpenCL/invalid-pipe-builtin-cl2.0.cl | ||
| 8148 | index 36e76621d24a..38b0a04726e3 100644 | ||
| 8149 | --- a/clang/test/SemaOpenCL/invalid-pipe-builtin-cl2.0.cl | ||
| 8150 | +++ b/clang/test/SemaOpenCL/invalid-pipe-builtin-cl2.0.cl | ||
| 8151 | @@ -1,4 +1,5 @@ | ||
| 8152 | // RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=+cl_khr_subgroups | ||
| 8153 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_subgroups,__opencl_c_pipes | ||
| 8154 | |||
| 8155 | #pragma OPENCL EXTENSION cl_khr_subgroups : enable | ||
| 8156 | |||
| 8157 | diff --git a/clang/test/SemaOpenCL/storageclass-cl20.cl b/clang/test/SemaOpenCL/storageclass-cl20.cl | ||
| 8158 | index 581701d2a6a5..469c526ebc30 100644 | ||
| 8159 | --- a/clang/test/SemaOpenCL/storageclass-cl20.cl | ||
| 8160 | +++ b/clang/test/SemaOpenCL/storageclass-cl20.cl | ||
| 8161 | @@ -1,4 +1,5 @@ | ||
| 8162 | // RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 | ||
| 8163 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_program_scope_global_variables,__opencl_c_generic_address_space | ||
| 8164 | |||
| 8165 | int G2 = 0; | ||
| 8166 | global int G3 = 0; | ||
| 8167 | diff --git a/clang/utils/TableGen/ClangOpenCLBuiltinEmitter.cpp b/clang/utils/TableGen/ClangOpenCLBuiltinEmitter.cpp | ||
| 8168 | index 41d33b550680..f50652493e5e 100644 | ||
| 8169 | --- a/clang/utils/TableGen/ClangOpenCLBuiltinEmitter.cpp | ||
| 8170 | +++ b/clang/utils/TableGen/ClangOpenCLBuiltinEmitter.cpp | ||
| 8171 | @@ -56,6 +56,7 @@ | ||
| 8172 | //===----------------------------------------------------------------------===// | ||
| 8173 | |||
| 8174 | #include "TableGenBackends.h" | ||
| 8175 | +#include "clang/Basic/OpenCLOptions.h" | ||
| 8176 | #include "llvm/ADT/MapVector.h" | ||
| 8177 | #include "llvm/ADT/STLExtras.h" | ||
| 8178 | #include "llvm/ADT/SmallString.h" | ||
| 8179 | @@ -69,6 +70,7 @@ | ||
| 8180 | #include "llvm/TableGen/Record.h" | ||
| 8181 | #include "llvm/TableGen/StringMatcher.h" | ||
| 8182 | #include "llvm/TableGen/TableGenBackend.h" | ||
| 8183 | +#include <numeric> | ||
| 8184 | #include <set> | ||
| 8185 | |||
| 8186 | using namespace llvm; | ||
| 8187 | @@ -228,6 +230,10 @@ private: | ||
| 8188 | // The function "tan", having the same signatures, would be mapped to the | ||
| 8189 | // same entry (<I1, I2, I3>). | ||
| 8190 | MapVector<BuiltinIndexListTy *, BuiltinTableEntries> SignatureListMap; | ||
| 8191 | + | ||
| 8192 | + // Encode all versions | ||
| 8193 | + unsigned short | ||
| 8194 | + EncodeBuiltinVersions(std::vector<Record *> BuiltinVersionsRecords) const; | ||
| 8195 | }; | ||
| 8196 | } // namespace | ||
| 8197 | |||
| 8198 | @@ -338,12 +344,10 @@ struct OpenCLBuiltinStruct { | ||
| 8199 | const bool IsConst; | ||
| 8200 | // Function attribute __attribute__((convergent)) | ||
| 8201 | const bool IsConv; | ||
| 8202 | + // All opencl versions encoded | ||
| 8203 | + const unsigned char AllVersions : 5; | ||
| 8204 | // OpenCL extension(s) required for this overload. | ||
| 8205 | const unsigned short Extension; | ||
| 8206 | - // First OpenCL version in which this overload was introduced (e.g. CL20). | ||
| 8207 | - const unsigned short MinVersion; | ||
| 8208 | - // First OpenCL version in which this overload was removed (e.g. CL20). | ||
| 8209 | - const unsigned short MaxVersion; | ||
| 8210 | }; | ||
| 8211 | |||
| 8212 | )"; | ||
| 8213 | @@ -503,11 +507,9 @@ void BuiltinNameEmitter::EmitBuiltinTable() { | ||
| 8214 | << (Overload.first->getValueAsBit("IsPure")) << ", " | ||
| 8215 | << (Overload.first->getValueAsBit("IsConst")) << ", " | ||
| 8216 | << (Overload.first->getValueAsBit("IsConv")) << ", " | ||
| 8217 | - << FunctionExtensionIndex[ExtName] << ", " | ||
| 8218 | - << Overload.first->getValueAsDef("MinVersion")->getValueAsInt("ID") | ||
| 8219 | - << ", " | ||
| 8220 | - << Overload.first->getValueAsDef("MaxVersion")->getValueAsInt("ID") | ||
| 8221 | - << " },\n"; | ||
| 8222 | + << EncodeBuiltinVersions( | ||
| 8223 | + Overload.first->getValueAsListOfDefs("Versions")) | ||
| 8224 | + << ", " << FunctionExtensionIndex[ExtName] << " },\n"; | ||
| 8225 | Index++; | ||
| 8226 | } | ||
| 8227 | } | ||
| 8228 | @@ -528,10 +530,8 @@ bool BuiltinNameEmitter::CanReuseSignature( | ||
| 8229 | if (Rec->getValueAsBit("IsPure") == Rec2->getValueAsBit("IsPure") && | ||
| 8230 | Rec->getValueAsBit("IsConst") == Rec2->getValueAsBit("IsConst") && | ||
| 8231 | Rec->getValueAsBit("IsConv") == Rec2->getValueAsBit("IsConv") && | ||
| 8232 | - Rec->getValueAsDef("MinVersion")->getValueAsInt("ID") == | ||
| 8233 | - Rec2->getValueAsDef("MinVersion")->getValueAsInt("ID") && | ||
| 8234 | - Rec->getValueAsDef("MaxVersion")->getValueAsInt("ID") == | ||
| 8235 | - Rec2->getValueAsDef("MaxVersion")->getValueAsInt("ID") && | ||
| 8236 | + EncodeBuiltinVersions(Rec->getValueAsListOfDefs("Versions")) == | ||
| 8237 | + EncodeBuiltinVersions(Rec2->getValueAsListOfDefs("Versions")) && | ||
| 8238 | Rec->getValueAsDef("Extension")->getName() == | ||
| 8239 | Rec2->getValueAsDef("Extension")->getName()) { | ||
| 8240 | return true; | ||
| 8241 | @@ -806,6 +806,15 @@ static void OCL2Qual(ASTContext &Context, const OpenCLTypeStruct &Ty, | ||
| 8242 | OS << "\n} // OCL2Qual\n"; | ||
| 8243 | } | ||
| 8244 | |||
| 8245 | +unsigned short BuiltinNameEmitter::EncodeBuiltinVersions( | ||
| 8246 | + std::vector<Record *> BuiltinVersionsRecords) const { | ||
| 8247 | + return std::accumulate( | ||
| 8248 | + BuiltinVersionsRecords.begin(), BuiltinVersionsRecords.end(), | ||
| 8249 | + (unsigned short)0, [](unsigned short C, Record *R) { | ||
| 8250 | + return C |= clang::OpenCLOptions::EncodeVersion(R->getValueAsInt("ID")); | ||
| 8251 | + }); | ||
| 8252 | +} | ||
| 8253 | + | ||
| 8254 | void clang::EmitClangOpenCLBuiltins(RecordKeeper &Records, raw_ostream &OS) { | ||
| 8255 | BuiltinNameEmitter NameChecker(Records, OS); | ||
| 8256 | NameChecker.Emit(); | ||
| 8257 | -- | ||
| 8258 | 2.17.1 | ||
| 8259 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-Remove-repo-name-in-LLVM-IR.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-Remove-repo-name-in-LLVM-IR.patch deleted file mode 100644 index 232ae063..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-Remove-repo-name-in-LLVM-IR.patch +++ /dev/null | |||
| @@ -1,50 +0,0 @@ | |||
| 1 | From b53fd86ffdeacb9b13624bdb110fd25e8c35cb92 Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Feng Zou <feng.zou@intel.com> | ||
| 3 | Date: Mon, 19 Oct 2020 14:43:38 +0800 | ||
| 4 | Subject: [PATCH] Remove repo name in LLVM IR | ||
| 5 | |||
| 6 | Upstream-Status: Backport [Taken from opencl-clang patches, https://github.com/intel/opencl-clang/blob/ocl-open-100/patches/llvm/0003-Remove-repo-name-in-LLVM-IR.patch] | ||
| 7 | Signed-off-by: Feng Zou <feng.zou@intel.com> | ||
| 8 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 9 | |||
| 10 | --- | ||
| 11 | llvm/cmake/modules/VersionFromVCS.cmake | 23 ++++++++++++----------- | ||
| 12 | 1 file changed, 12 insertions(+), 11 deletions(-) | ||
| 13 | |||
| 14 | diff --git a/llvm/cmake/modules/VersionFromVCS.cmake b/llvm/cmake/modules/VersionFromVCS.cmake | ||
| 15 | index 1b6519b4b7c..8fd6b23bb34 100644 | ||
| 16 | --- a/llvm/cmake/modules/VersionFromVCS.cmake | ||
| 17 | +++ b/llvm/cmake/modules/VersionFromVCS.cmake | ||
| 18 | @@ -33,17 +33,18 @@ function(get_source_info path revision repository) | ||
| 19 | else() | ||
| 20 | set(remote "origin") | ||
| 21 | endif() | ||
| 22 | - execute_process(COMMAND ${GIT_EXECUTABLE} remote get-url ${remote} | ||
| 23 | - WORKING_DIRECTORY ${path} | ||
| 24 | - RESULT_VARIABLE git_result | ||
| 25 | - OUTPUT_VARIABLE git_output | ||
| 26 | - ERROR_QUIET) | ||
| 27 | - if(git_result EQUAL 0) | ||
| 28 | - string(STRIP "${git_output}" git_output) | ||
| 29 | - set(${repository} ${git_output} PARENT_SCOPE) | ||
| 30 | - else() | ||
| 31 | - set(${repository} ${path} PARENT_SCOPE) | ||
| 32 | - endif() | ||
| 33 | + # Do not show repo name in IR | ||
| 34 | + # execute_process(COMMAND ${GIT_EXECUTABLE} remote get-url ${remote} | ||
| 35 | + # WORKING_DIRECTORY ${path} | ||
| 36 | + # RESULT_VARIABLE git_result | ||
| 37 | + # OUTPUT_VARIABLE git_output | ||
| 38 | + # ERROR_QUIET) | ||
| 39 | + # if(git_result EQUAL 0) | ||
| 40 | + # string(STRIP "${git_output}" git_output) | ||
| 41 | + # set(${repository} ${git_output} PARENT_SCOPE) | ||
| 42 | + # else() | ||
| 43 | + # set(${repository} ${path} PARENT_SCOPE) | ||
| 44 | + # endif() | ||
| 45 | endif() | ||
| 46 | endif() | ||
| 47 | endfunction() | ||
| 48 | -- | ||
| 49 | 2.18.1 | ||
| 50 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-skip-building-tests.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-skip-building-tests.patch deleted file mode 100644 index 8e58ec25..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm10-skip-building-tests.patch +++ /dev/null | |||
| @@ -1,51 +0,0 @@ | |||
| 1 | From 455ce9c25df5313f4a6649cc27075bdfbe25af18 Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 3 | Date: Wed, 21 Aug 2019 14:35:31 +0800 | ||
| 4 | Subject: [PATCH] llvm-spirv: skip building tests | ||
| 5 | |||
| 6 | Some of these need clang to be built and since we're building this in-tree, | ||
| 7 | that leads to problems when compiling libcxx, compiler-rt which aren't built | ||
| 8 | in-tree. | ||
| 9 | |||
| 10 | Instead of using SPIRV_SKIP_CLANG_BUILD to skip clang build and adding this to | ||
| 11 | all components, disable the building of tests altogether. | ||
| 12 | |||
| 13 | Upstream-Status: Inappropriate | ||
| 14 | |||
| 15 | Signed-off-by: Anuj Mittal <anuj.mittal@intel.com> | ||
| 16 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 17 | --- | ||
| 18 | CMakeLists.txt | 10 ---------- | ||
| 19 | 1 file changed, 10 deletions(-) | ||
| 20 | |||
| 21 | diff --git a/CMakeLists.txt b/CMakeLists.txt | ||
| 22 | index b718c00..9805140 100644 | ||
| 23 | --- a/CMakeLists.txt | ||
| 24 | +++ b/CMakeLists.txt | ||
| 25 | @@ -24,13 +24,6 @@ if(LLVM_SPIRV_BUILD_EXTERNAL) | ||
| 26 | set(CMAKE_CXX_STANDARD 14) | ||
| 27 | set(CMAKE_CXX_STANDARD_REQUIRED ON) | ||
| 28 | |||
| 29 | - if(LLVM_SPIRV_INCLUDE_TESTS) | ||
| 30 | - set(LLVM_TEST_COMPONENTS | ||
| 31 | - llvm-as | ||
| 32 | - llvm-dis | ||
| 33 | - ) | ||
| 34 | - endif(LLVM_SPIRV_INCLUDE_TESTS) | ||
| 35 | - | ||
| 36 | find_package(LLVM 10.0.0 REQUIRED | ||
| 37 | COMPONENTS | ||
| 38 | Analysis | ||
| 39 | @@ -61,9 +54,6 @@ set(LLVM_SPIRV_INCLUDE_DIRS ${CMAKE_CURRENT_SOURCE_DIR}/include) | ||
| 40 | |||
| 41 | add_subdirectory(lib/SPIRV) | ||
| 42 | add_subdirectory(tools/llvm-spirv) | ||
| 43 | -if(LLVM_SPIRV_INCLUDE_TESTS) | ||
| 44 | - add_subdirectory(test) | ||
| 45 | -endif(LLVM_SPIRV_INCLUDE_TESTS) | ||
| 46 | |||
| 47 | install( | ||
| 48 | FILES | ||
| 49 | -- | ||
| 50 | 2.7.4 | ||
| 51 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-OpenCL-3.0-support.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-OpenCL-3.0-support.patch deleted file mode 100644 index 98545db0..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-OpenCL-3.0-support.patch +++ /dev/null | |||
| @@ -1,8453 +0,0 @@ | |||
| 1 | From d767afa79d1c8153081eac1ef33e348cadbea5bb Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Anton Zabaznov <anton.zabaznov@intel.com> | ||
| 3 | Date: Tue, 22 Sep 2020 19:03:50 +0300 | ||
| 4 | Subject: [PATCH] OpenCL 3.0 support | ||
| 5 | |||
| 6 | Upstream-Status: Backport [Taken from opencl-clang patches, https://github.com/intel/opencl-clang/blob/ocl-open-110/patches/clang/0001-OpenCL-3.0-support.patch] | ||
| 7 | Signed-off-by: Anton Zabaznov <anton.zabaznov@intel.com> | ||
| 8 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 9 | |||
| 10 | |||
| 11 | --- | ||
| 12 | clang/include/clang/Basic/Builtins.def | 65 +- | ||
| 13 | clang/include/clang/Basic/Builtins.h | 13 +- | ||
| 14 | .../clang/Basic/DiagnosticParseKinds.td | 2 + | ||
| 15 | .../clang/Basic/DiagnosticSemaKinds.td | 7 + | ||
| 16 | clang/include/clang/Basic/LangOptions.def | 2 + | ||
| 17 | clang/include/clang/Basic/LangStandards.def | 4 + | ||
| 18 | .../include/clang/Basic/OpenCLExtensions.def | 15 + | ||
| 19 | clang/include/clang/Basic/OpenCLOptions.h | 174 +- | ||
| 20 | clang/include/clang/Driver/Options.td | 2 +- | ||
| 21 | clang/include/clang/Sema/Sema.h | 9 + | ||
| 22 | clang/lib/AST/ASTContext.cpp | 3 +- | ||
| 23 | clang/lib/Basic/Builtins.cpp | 28 +- | ||
| 24 | clang/lib/Basic/TargetInfo.cpp | 11 + | ||
| 25 | clang/lib/Basic/Targets.cpp | 1 - | ||
| 26 | clang/lib/CodeGen/CodeGenFunction.cpp | 6 +- | ||
| 27 | clang/lib/Frontend/CompilerInvocation.cpp | 22 +- | ||
| 28 | clang/lib/Frontend/InitPreprocessor.cpp | 6 +- | ||
| 29 | clang/lib/Headers/opencl-c-base.h | 75 +- | ||
| 30 | clang/lib/Headers/opencl-c.h | 3216 ++++++++++++++--- | ||
| 31 | clang/lib/Parse/ParseDecl.cpp | 12 +- | ||
| 32 | clang/lib/Parse/ParsePragma.cpp | 10 +- | ||
| 33 | clang/lib/Sema/OpenCLBuiltins.td | 153 +- | ||
| 34 | clang/lib/Sema/Sema.cpp | 47 +- | ||
| 35 | clang/lib/Sema/SemaChecking.cpp | 38 +- | ||
| 36 | clang/lib/Sema/SemaDecl.cpp | 18 +- | ||
| 37 | clang/lib/Sema/SemaDeclAttr.cpp | 9 +- | ||
| 38 | clang/lib/Sema/SemaDeclCXX.cpp | 12 +- | ||
| 39 | clang/lib/Sema/SemaLookup.cpp | 19 +- | ||
| 40 | clang/lib/Sema/SemaType.cpp | 14 +- | ||
| 41 | .../CodeGenOpenCL/addr-space-struct-arg.cl | 7 +- | ||
| 42 | .../address-spaces-conversions.cl | 2 + | ||
| 43 | .../CodeGenOpenCL/address-spaces-mangling.cl | 3 +- | ||
| 44 | clang/test/CodeGenOpenCL/address-spaces.cl | 4 + | ||
| 45 | .../amdgcn-automatic-variable.cl | 1 + | ||
| 46 | .../CodeGenOpenCL/amdgpu-sizeof-alignof.cl | 21 +- | ||
| 47 | .../CodeGenOpenCL/arm-integer-dot-product.cl | 1 + | ||
| 48 | .../test/CodeGenOpenCL/cl-uniform-wg-size.cl | 2 + | ||
| 49 | clang/test/CodeGenOpenCL/fpmath.cl | 2 + | ||
| 50 | .../generic-address-space-feature.cl | 28 + | ||
| 51 | .../intel-subgroups-avc-ext-types.cl | 1 + | ||
| 52 | .../kernels-have-spir-cc-by-default.cl | 3 + | ||
| 53 | clang/test/CodeGenOpenCL/logical-ops.cl | 1 + | ||
| 54 | clang/test/CodeGenOpenCL/no-half.cl | 1 + | ||
| 55 | clang/test/CodeGenOpenCL/pipe_builtin.cl | 3 + | ||
| 56 | clang/test/CodeGenOpenCL/pipe_types.cl | 1 + | ||
| 57 | clang/test/CodeGenOpenCL/printf.cl | 2 + | ||
| 58 | clang/test/CodeGenOpenCL/unroll-hint.cl | 1 + | ||
| 59 | clang/test/Driver/autocomplete.c | 2 + | ||
| 60 | clang/test/Driver/opencl.cl | 2 + | ||
| 61 | clang/test/Driver/unknown-std.cl | 1 + | ||
| 62 | clang/test/Frontend/stdlang.c | 1 + | ||
| 63 | clang/test/Headers/opencl-c-header.cl | 7 +- | ||
| 64 | clang/test/Index/pipe-size.cl | 7 + | ||
| 65 | clang/test/Preprocessor/init-aarch64.c | 12 +- | ||
| 66 | clang/test/Preprocessor/predefined-macros.c | 13 + | ||
| 67 | .../Sema/feature-extensions-simult-support.cl | 75 + | ||
| 68 | clang/test/Sema/features-ignore-pragma.cl | 24 + | ||
| 69 | clang/test/Sema/opencl-features-pipes.cl | 18 + | ||
| 70 | clang/test/Sema/opencl-features.cl | 128 + | ||
| 71 | clang/test/Sema/pipe_builtins_feature.cl | 21 + | ||
| 72 | .../address-spaces-conversions-cl2.0.cl | 3 + | ||
| 73 | clang/test/SemaOpenCL/address-spaces.cl | 1 + | ||
| 74 | .../SemaOpenCL/cl20-device-side-enqueue.cl | 16 +- | ||
| 75 | .../SemaOpenCL/forget-unsupported-builtins.cl | 22 + | ||
| 76 | clang/test/SemaOpenCL/image-features.cl | 20 + | ||
| 77 | .../SemaOpenCL/invalid-pipe-builtin-cl2.0.cl | 1 + | ||
| 78 | clang/test/SemaOpenCL/storageclass-cl20.cl | 1 + | ||
| 79 | .../TableGen/ClangOpenCLBuiltinEmitter.cpp | 35 +- | ||
| 80 | 68 files changed, 3749 insertions(+), 738 deletions(-) | ||
| 81 | create mode 100644 clang/test/CodeGenOpenCL/generic-address-space-feature.cl | ||
| 82 | create mode 100644 clang/test/Sema/feature-extensions-simult-support.cl | ||
| 83 | create mode 100644 clang/test/Sema/features-ignore-pragma.cl | ||
| 84 | create mode 100644 clang/test/Sema/opencl-features-pipes.cl | ||
| 85 | create mode 100644 clang/test/Sema/opencl-features.cl | ||
| 86 | create mode 100644 clang/test/Sema/pipe_builtins_feature.cl | ||
| 87 | create mode 100644 clang/test/SemaOpenCL/forget-unsupported-builtins.cl | ||
| 88 | create mode 100644 clang/test/SemaOpenCL/image-features.cl | ||
| 89 | |||
| 90 | diff --git a/clang/include/clang/Basic/Builtins.def b/clang/include/clang/Basic/Builtins.def | ||
| 91 | index 5463b7dfc18c..e094beab9a6c 100644 | ||
| 92 | --- a/clang/include/clang/Basic/Builtins.def | ||
| 93 | +++ b/clang/include/clang/Basic/Builtins.def | ||
| 94 | @@ -111,6 +111,10 @@ | ||
| 95 | # define LANGBUILTIN(ID, TYPE, ATTRS, BUILTIN_LANG) BUILTIN(ID, TYPE, ATTRS) | ||
| 96 | #endif | ||
| 97 | |||
| 98 | +#if defined(BUILTIN) && !defined(OPENCLBUILTIN) | ||
| 99 | +# define OPENCLBUILTIN(ID, TYPE, ATTRS, BUILTIN_LANG, FEATURE) BUILTIN(ID, TYPE, ATTRS) | ||
| 100 | +#endif | ||
| 101 | + | ||
| 102 | // Standard libc/libm functions: | ||
| 103 | BUILTIN(__builtin_atan2 , "ddd" , "Fne") | ||
| 104 | BUILTIN(__builtin_atan2f, "fff" , "Fne") | ||
| 105 | @@ -1529,50 +1533,54 @@ BUILTIN(__builtin_coro_param, "bv*v*", "n") | ||
| 106 | |||
| 107 | // OpenCL v2.0 s6.13.16, s9.17.3.5 - Pipe functions. | ||
| 108 | // We need the generic prototype, since the packet type could be anything. | ||
| 109 | -LANGBUILTIN(read_pipe, "i.", "tn", OCLC20_LANG) | ||
| 110 | -LANGBUILTIN(write_pipe, "i.", "tn", OCLC20_LANG) | ||
| 111 | +OPENCLBUILTIN(read_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 112 | +OPENCLBUILTIN(write_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 113 | |||
| 114 | -LANGBUILTIN(reserve_read_pipe, "i.", "tn", OCLC20_LANG) | ||
| 115 | -LANGBUILTIN(reserve_write_pipe, "i.", "tn", OCLC20_LANG) | ||
| 116 | +OPENCLBUILTIN(reserve_read_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 117 | +OPENCLBUILTIN(reserve_write_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 118 | |||
| 119 | -LANGBUILTIN(commit_write_pipe, "v.", "tn", OCLC20_LANG) | ||
| 120 | -LANGBUILTIN(commit_read_pipe, "v.", "tn", OCLC20_LANG) | ||
| 121 | +OPENCLBUILTIN(commit_write_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 122 | +OPENCLBUILTIN(commit_read_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 123 | |||
| 124 | -LANGBUILTIN(sub_group_reserve_read_pipe, "i.", "tn", OCLC20_LANG) | ||
| 125 | -LANGBUILTIN(sub_group_reserve_write_pipe, "i.", "tn", OCLC20_LANG) | ||
| 126 | +OPENCLBUILTIN(sub_group_reserve_read_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 127 | +OPENCLBUILTIN(sub_group_reserve_write_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 128 | |||
| 129 | -LANGBUILTIN(sub_group_commit_read_pipe, "v.", "tn", OCLC20_LANG) | ||
| 130 | -LANGBUILTIN(sub_group_commit_write_pipe, "v.", "tn", OCLC20_LANG) | ||
| 131 | +OPENCLBUILTIN(sub_group_commit_read_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 132 | +OPENCLBUILTIN(sub_group_commit_write_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 133 | |||
| 134 | -LANGBUILTIN(work_group_reserve_read_pipe, "i.", "tn", OCLC20_LANG) | ||
| 135 | -LANGBUILTIN(work_group_reserve_write_pipe, "i.", "tn", OCLC20_LANG) | ||
| 136 | +OPENCLBUILTIN(work_group_reserve_read_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 137 | +OPENCLBUILTIN(work_group_reserve_write_pipe, "i.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 138 | |||
| 139 | -LANGBUILTIN(work_group_commit_read_pipe, "v.", "tn", OCLC20_LANG) | ||
| 140 | -LANGBUILTIN(work_group_commit_write_pipe, "v.", "tn", OCLC20_LANG) | ||
| 141 | +OPENCLBUILTIN(work_group_commit_read_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 142 | +OPENCLBUILTIN(work_group_commit_write_pipe, "v.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 143 | |||
| 144 | -LANGBUILTIN(get_pipe_num_packets, "Ui.", "tn", OCLC20_LANG) | ||
| 145 | -LANGBUILTIN(get_pipe_max_packets, "Ui.", "tn", OCLC20_LANG) | ||
| 146 | +OPENCLBUILTIN(get_pipe_num_packets, "Ui.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 147 | +OPENCLBUILTIN(get_pipe_max_packets, "Ui.", "tn", OCLC2P_LANG, "__opencl_c_pipes") | ||
| 148 | |||
| 149 | // OpenCL v2.0 s6.13.17 - Enqueue kernel functions. | ||
| 150 | // Custom builtin check allows to perform special check of passed block arguments. | ||
| 151 | -LANGBUILTIN(enqueue_kernel, "i.", "tn", OCLC20_LANG) | ||
| 152 | -LANGBUILTIN(get_kernel_work_group_size, "Ui.", "tn", OCLC20_LANG) | ||
| 153 | -LANGBUILTIN(get_kernel_preferred_work_group_size_multiple, "Ui.", "tn", OCLC20_LANG) | ||
| 154 | -LANGBUILTIN(get_kernel_max_sub_group_size_for_ndrange, "Ui.", "tn", OCLC20_LANG) | ||
| 155 | -LANGBUILTIN(get_kernel_sub_group_count_for_ndrange, "Ui.", "tn", OCLC20_LANG) | ||
| 156 | +OPENCLBUILTIN(enqueue_kernel, "i.", "tn", OCLC2P_LANG, | ||
| 157 | + "__opencl_c_device_enqueue") | ||
| 158 | +OPENCLBUILTIN(get_kernel_work_group_size, "Ui.", "tn", OCLC2P_LANG, | ||
| 159 | + "__opencl_c_device_enqueue") | ||
| 160 | +OPENCLBUILTIN(get_kernel_preferred_work_group_size_multiple, "Ui.", "tn", | ||
| 161 | + OCLC2P_LANG, "__opencl_c_device_enqueue") | ||
| 162 | +OPENCLBUILTIN(get_kernel_max_sub_group_size_for_ndrange, "Ui.", "tn", | ||
| 163 | + OCLC2P_LANG, "__opencl_c_device_enqueue") | ||
| 164 | +OPENCLBUILTIN(get_kernel_sub_group_count_for_ndrange, "Ui.", "tn", OCLC2P_LANG, "__opencl_c_device_enqueue") | ||
| 165 | |||
| 166 | // OpenCL v2.0 s6.13.9 - Address space qualifier functions. | ||
| 167 | // FIXME: Pointer parameters of OpenCL builtins should have their address space | ||
| 168 | // requirement defined. | ||
| 169 | -LANGBUILTIN(to_global, "v*v*", "tn", OCLC20_LANG) | ||
| 170 | -LANGBUILTIN(to_local, "v*v*", "tn", OCLC20_LANG) | ||
| 171 | -LANGBUILTIN(to_private, "v*v*", "tn", OCLC20_LANG) | ||
| 172 | +OPENCLBUILTIN(to_global, "v*v*", "tn", OCLC2P_LANG, "__opencl_c_generic_address_space") | ||
| 173 | +OPENCLBUILTIN(to_local, "v*v*", "tn", OCLC2P_LANG, "__opencl_c_generic_address_space") | ||
| 174 | +OPENCLBUILTIN(to_private, "v*v*", "tn", OCLC2P_LANG, "__opencl_c_generic_address_space") | ||
| 175 | |||
| 176 | // OpenCL half load/store builtin | ||
| 177 | -LANGBUILTIN(__builtin_store_half, "vdh*", "n", ALL_OCLC_LANGUAGES) | ||
| 178 | -LANGBUILTIN(__builtin_store_halff, "vfh*", "n", ALL_OCLC_LANGUAGES) | ||
| 179 | -LANGBUILTIN(__builtin_load_half, "dhC*", "nc", ALL_OCLC_LANGUAGES) | ||
| 180 | -LANGBUILTIN(__builtin_load_halff, "fhC*", "nc", ALL_OCLC_LANGUAGES) | ||
| 181 | +OPENCLBUILTIN(__builtin_store_half, "vdh*", "n", ALL_OCLC_LANGUAGES, "") | ||
| 182 | +OPENCLBUILTIN(__builtin_store_halff, "vfh*", "n", ALL_OCLC_LANGUAGES, "") | ||
| 183 | +OPENCLBUILTIN(__builtin_load_half, "dhC*", "nc", ALL_OCLC_LANGUAGES, "") | ||
| 184 | +OPENCLBUILTIN(__builtin_load_halff, "fhC*", "nc", ALL_OCLC_LANGUAGES, "") | ||
| 185 | |||
| 186 | // Builtins for os_log/os_trace | ||
| 187 | BUILTIN(__builtin_os_log_format_buffer_size, "zcC*.", "p:0:nut") | ||
| 188 | @@ -1593,3 +1601,4 @@ BUILTIN(__builtin_ms_va_copy, "vc*&c*&", "n") | ||
| 189 | #undef BUILTIN | ||
| 190 | #undef LIBBUILTIN | ||
| 191 | #undef LANGBUILTIN | ||
| 192 | +#undef OPENCLBUILTIN | ||
| 193 | diff --git a/clang/include/clang/Basic/Builtins.h b/clang/include/clang/Basic/Builtins.h | ||
| 194 | index 15bfcf797917..ba3e7853444c 100644 | ||
| 195 | --- a/clang/include/clang/Basic/Builtins.h | ||
| 196 | +++ b/clang/include/clang/Basic/Builtins.h | ||
| 197 | @@ -33,13 +33,13 @@ enum LanguageID { | ||
| 198 | CXX_LANG = 0x4, // builtin for cplusplus only. | ||
| 199 | OBJC_LANG = 0x8, // builtin for objective-c and objective-c++ | ||
| 200 | MS_LANG = 0x10, // builtin requires MS mode. | ||
| 201 | - OCLC20_LANG = 0x20, // builtin for OpenCL C 2.0 only. | ||
| 202 | + OCLC2P_LANG = 0x20, // builtin for OpenCL C 2.0+ versions. | ||
| 203 | OCLC1X_LANG = 0x40, // builtin for OpenCL C 1.x only. | ||
| 204 | OMP_LANG = 0x80, // builtin requires OpenMP. | ||
| 205 | ALL_LANGUAGES = C_LANG | CXX_LANG | OBJC_LANG, // builtin for all languages. | ||
| 206 | ALL_GNU_LANGUAGES = ALL_LANGUAGES | GNU_LANG, // builtin requires GNU mode. | ||
| 207 | ALL_MS_LANGUAGES = ALL_LANGUAGES | MS_LANG, // builtin requires MS mode. | ||
| 208 | - ALL_OCLC_LANGUAGES = OCLC1X_LANG | OCLC20_LANG // builtin for OCLC languages. | ||
| 209 | + ALL_OCLC_LANGUAGES = OCLC1X_LANG | OCLC2P_LANG // builtin for OCLC languages. | ||
| 210 | }; | ||
| 211 | |||
| 212 | namespace Builtin { | ||
| 213 | @@ -235,6 +235,10 @@ public: | ||
| 214 | /// for non-builtins. | ||
| 215 | bool canBeRedeclared(unsigned ID) const; | ||
| 216 | |||
| 217 | + bool requiresFeatures(unsigned ID) const { | ||
| 218 | + return requiresFeatures(getRecord(ID)); | ||
| 219 | + } | ||
| 220 | + | ||
| 221 | private: | ||
| 222 | const Info &getRecord(unsigned ID) const; | ||
| 223 | |||
| 224 | @@ -242,6 +246,11 @@ private: | ||
| 225 | bool builtinIsSupported(const Builtin::Info &BuiltinInfo, | ||
| 226 | const LangOptions &LangOpts); | ||
| 227 | |||
| 228 | + bool OclBuiltinIsSupported(const Builtin::Info &BuiltinInfo, | ||
| 229 | + const LangOptions &LangOpts) const; | ||
| 230 | + | ||
| 231 | + bool requiresFeatures(const Builtin::Info &BuiltinInfo) const; | ||
| 232 | + | ||
| 233 | /// Helper function for isPrintfLike and isScanfLike. | ||
| 234 | bool isLike(unsigned ID, unsigned &FormatIdx, bool &HasVAListArg, | ||
| 235 | const char *Fmt) const; | ||
| 236 | diff --git a/clang/include/clang/Basic/DiagnosticParseKinds.td b/clang/include/clang/Basic/DiagnosticParseKinds.td | ||
| 237 | index 1038a4119d4c..ba1b1b67a131 100644 | ||
| 238 | --- a/clang/include/clang/Basic/DiagnosticParseKinds.td | ||
| 239 | +++ b/clang/include/clang/Basic/DiagnosticParseKinds.td | ||
| 240 | @@ -1206,6 +1206,8 @@ def warn_pragma_unsupported_extension : Warning< | ||
| 241 | "unsupported OpenCL extension %0 - ignoring">, InGroup<IgnoredPragmas>; | ||
| 242 | def warn_pragma_extension_is_core : Warning< | ||
| 243 | "OpenCL extension %0 is core feature or supported optional core feature - ignoring">, InGroup<DiagGroup<"pedantic-core-features">>, DefaultIgnore; | ||
| 244 | +def warn_opencl_pragma_feature_ignore : Warning< | ||
| 245 | + "OpenCL feature support can't be controlled via pragma, ignoring">, InGroup<IgnoredPragmas>; | ||
| 246 | |||
| 247 | // OpenCL errors. | ||
| 248 | def err_opencl_taking_function_address_parser : Error< | ||
| 249 | diff --git a/clang/include/clang/Basic/DiagnosticSemaKinds.td b/clang/include/clang/Basic/DiagnosticSemaKinds.td | ||
| 250 | index 941f2cafc372..aa9e8b7b011b 100644 | ||
| 251 | --- a/clang/include/clang/Basic/DiagnosticSemaKinds.td | ||
| 252 | +++ b/clang/include/clang/Basic/DiagnosticSemaKinds.td | ||
| 253 | @@ -9741,6 +9741,13 @@ def ext_opencl_ext_vector_type_rgba_selector: ExtWarn< | ||
| 254 | def err_openclcxx_placement_new : Error< | ||
| 255 | "use of placement new requires explicit declaration">; | ||
| 256 | |||
| 257 | +def err_opencl_pipes_require_feat : Error< | ||
| 258 | + "usage of OpenCL pipes requires feature support">; | ||
| 259 | +def err_opencl_memory_scope_require_feat : Error< | ||
| 260 | + "usage of memory scope requires feature support">; | ||
| 261 | +def err_opencl_memory_ordering_require_feat : Error< | ||
| 262 | + "usage of memory ordering requires feature support">; | ||
| 263 | + | ||
| 264 | // MIG routine annotations. | ||
| 265 | def warn_mig_server_routine_does_not_return_kern_return_t : Warning< | ||
| 266 | "'mig_server_routine' attribute only applies to routines that return a kern_return_t">, | ||
| 267 | diff --git a/clang/include/clang/Basic/LangOptions.def b/clang/include/clang/Basic/LangOptions.def | ||
| 268 | index 70f68d664bb7..e683f5956975 100644 | ||
| 269 | --- a/clang/include/clang/Basic/LangOptions.def | ||
| 270 | +++ b/clang/include/clang/Basic/LangOptions.def | ||
| 271 | @@ -215,6 +215,8 @@ LANGOPT(OpenCL , 1, 0, "OpenCL") | ||
| 272 | LANGOPT(OpenCLVersion , 32, 0, "OpenCL C version") | ||
| 273 | LANGOPT(OpenCLCPlusPlus , 1, 0, "C++ for OpenCL") | ||
| 274 | LANGOPT(OpenCLCPlusPlusVersion , 32, 0, "C++ for OpenCL version") | ||
| 275 | +LANGOPT(OpenCLGenericKeyword , 1, 0, "OpenCL generic keyword") | ||
| 276 | +LANGOPT(OpenCLPipeKeyword , 1, 0, "OpenCL pipe keyword") | ||
| 277 | LANGOPT(NativeHalfType , 1, 0, "Native half type support") | ||
| 278 | LANGOPT(NativeHalfArgsAndReturns, 1, 0, "Native half args and returns") | ||
| 279 | LANGOPT(HalfArgsAndReturns, 1, 0, "half args and returns") | ||
| 280 | diff --git a/clang/include/clang/Basic/LangStandards.def b/clang/include/clang/Basic/LangStandards.def | ||
| 281 | index b09568e8b3e8..7b915c312746 100644 | ||
| 282 | --- a/clang/include/clang/Basic/LangStandards.def | ||
| 283 | +++ b/clang/include/clang/Basic/LangStandards.def | ||
| 284 | @@ -167,6 +167,9 @@ LANGSTANDARD(opencl12, "cl1.2", | ||
| 285 | LANGSTANDARD(opencl20, "cl2.0", | ||
| 286 | OpenCL, "OpenCL 2.0", | ||
| 287 | LineComment | C99 | Digraphs | HexFloat | OpenCL) | ||
| 288 | +LANGSTANDARD(opencl30, "cl3.0", | ||
| 289 | + OpenCL, "OpenCL 3.0", | ||
| 290 | + LineComment | C99 | Digraphs | HexFloat | OpenCL) | ||
| 291 | LANGSTANDARD(openclcpp, "clc++", | ||
| 292 | OpenCL, "C++ for OpenCL", | ||
| 293 | LineComment | CPlusPlus | CPlusPlus11 | CPlusPlus14 | CPlusPlus17 | | ||
| 294 | @@ -176,6 +179,7 @@ LANGSTANDARD_ALIAS_DEPR(opencl10, "CL") | ||
| 295 | LANGSTANDARD_ALIAS_DEPR(opencl11, "CL1.1") | ||
| 296 | LANGSTANDARD_ALIAS_DEPR(opencl12, "CL1.2") | ||
| 297 | LANGSTANDARD_ALIAS_DEPR(opencl20, "CL2.0") | ||
| 298 | +LANGSTANDARD_ALIAS_DEPR(opencl30, "CL3.0") | ||
| 299 | LANGSTANDARD_ALIAS_DEPR(openclcpp, "CLC++") | ||
| 300 | |||
| 301 | // CUDA | ||
| 302 | diff --git a/clang/include/clang/Basic/OpenCLExtensions.def b/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 303 | index 1ae36b32fb0a..d1574164f9b2 100644 | ||
| 304 | --- a/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 305 | +++ b/clang/include/clang/Basic/OpenCLExtensions.def | ||
| 306 | @@ -100,6 +100,21 @@ OPENCLEXT_INTERNAL(cl_intel_subgroups, 120, ~0U) | ||
| 307 | OPENCLEXT_INTERNAL(cl_intel_subgroups_short, 120, ~0U) | ||
| 308 | OPENCLEXT_INTERNAL(cl_intel_device_side_avc_motion_estimation, 120, ~0U) | ||
| 309 | |||
| 310 | +OPENCLEXT_INTERNAL(__opencl_c_pipes, 200, ~0U) | ||
| 311 | +OPENCLEXT_INTERNAL(__opencl_c_generic_address_space, 200, ~0U) | ||
| 312 | +OPENCLEXT_INTERNAL(__opencl_c_work_group_collective_functions, 200, ~0U) | ||
| 313 | +OPENCLEXT_INTERNAL(__opencl_c_atomic_order_acq_rel, 200, ~0U) | ||
| 314 | +OPENCLEXT_INTERNAL(__opencl_c_atomic_order_seq_cst, 200, ~0U) | ||
| 315 | +OPENCLEXT_INTERNAL(__opencl_c_atomic_scope_device, 200, ~0U) | ||
| 316 | +OPENCLEXT_INTERNAL(__opencl_c_atomic_scope_all_devices, 200, ~0U) | ||
| 317 | +OPENCLEXT_INTERNAL(__opencl_c_subgroups, 200, ~0U) | ||
| 318 | +OPENCLEXT_INTERNAL(__opencl_c_3d_image_writes, 100, ~0U) | ||
| 319 | +OPENCLEXT_INTERNAL(__opencl_c_device_enqueue, 200, ~0U) | ||
| 320 | +OPENCLEXT_INTERNAL(__opencl_c_read_write_images, 200, ~0U) | ||
| 321 | +OPENCLEXT_INTERNAL(__opencl_c_program_scope_global_variables, 200, ~0U) | ||
| 322 | +OPENCLEXT_INTERNAL(__opencl_c_fp64, 120, ~0U) | ||
| 323 | +OPENCLEXT_INTERNAL(__opencl_c_int64, 100, ~0U) | ||
| 324 | +OPENCLEXT_INTERNAL(__opencl_c_images, 100, ~0U) | ||
| 325 | #undef OPENCLEXT_INTERNAL | ||
| 326 | |||
| 327 | #ifdef OPENCLEXT | ||
| 328 | diff --git a/clang/include/clang/Basic/OpenCLOptions.h b/clang/include/clang/Basic/OpenCLOptions.h | ||
| 329 | index 15661154eab5..d5800f5611c6 100644 | ||
| 330 | --- a/clang/include/clang/Basic/OpenCLOptions.h | ||
| 331 | +++ b/clang/include/clang/Basic/OpenCLOptions.h | ||
| 332 | @@ -21,6 +21,10 @@ namespace clang { | ||
| 333 | |||
| 334 | /// OpenCL supported extensions and optional core features | ||
| 335 | class OpenCLOptions { | ||
| 336 | + // OpenCL Version | ||
| 337 | + unsigned CLVer = 120; | ||
| 338 | + bool IsOpenCLCPlusPlus = false; | ||
| 339 | + | ||
| 340 | struct Info { | ||
| 341 | bool Supported; // Is this option supported | ||
| 342 | bool Enabled; // Is this option enabled | ||
| 343 | @@ -31,7 +35,38 @@ class OpenCLOptions { | ||
| 344 | :Supported(S), Enabled(E), Avail(A), Core(C){} | ||
| 345 | }; | ||
| 346 | llvm::StringMap<Info> OptMap; | ||
| 347 | + | ||
| 348 | public: | ||
| 349 | + void setOpenCLVersion(const LangOptions &LO) { | ||
| 350 | + IsOpenCLCPlusPlus = LO.OpenCLCPlusPlus; | ||
| 351 | + CLVer = IsOpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 352 | + } | ||
| 353 | + | ||
| 354 | + // Get extension which is semantically equivalent to a given feature | ||
| 355 | + // if exists (e.g. __opencl_c_subgroups -> cl_khr_subgroups) | ||
| 356 | + llvm::Optional<StringRef> getEquivalentExtension(StringRef Feature) const { | ||
| 357 | + return llvm::StringSwitch<llvm::Optional<StringRef>>(Feature) | ||
| 358 | + .Case("__opencl_c_3d_image_writes", | ||
| 359 | + Optional<StringRef>("cl_khr_3d_image_writes")) | ||
| 360 | + .Case("__opencl_c_subgroups", Optional<StringRef>("cl_khr_subgroups")) | ||
| 361 | + .Case("__opencl_c_fp64", Optional<StringRef>("cl_khr_fp64")) | ||
| 362 | + .Default(Optional<StringRef>()); | ||
| 363 | + } | ||
| 364 | + | ||
| 365 | + // Same as above but for extensions | ||
| 366 | + llvm::Optional<StringRef> getEquivalentFeature(StringRef Extension) const { | ||
| 367 | + return llvm::StringSwitch<llvm::Optional<StringRef>>(Extension) | ||
| 368 | + .Case("cl_khr_3d_image_writes", | ||
| 369 | + Optional<StringRef>("__opencl_c_3d_image_writes")) | ||
| 370 | + .Case("cl_khr_subgroups", Optional<StringRef>("__opencl_c_subgroups")) | ||
| 371 | + .Case("cl_khr_fp64", Optional<StringRef>("__opencl_c_fp64")) | ||
| 372 | + .Default(Optional<StringRef>()); | ||
| 373 | + } | ||
| 374 | + | ||
| 375 | + bool isFeature(llvm::StringRef Ext) const { | ||
| 376 | + return Ext.startswith("__opencl_c"); | ||
| 377 | + } | ||
| 378 | + | ||
| 379 | bool isKnown(llvm::StringRef Ext) const { | ||
| 380 | return OptMap.find(Ext) != OptMap.end(); | ||
| 381 | } | ||
| 382 | @@ -42,32 +77,88 @@ public: | ||
| 383 | |||
| 384 | // Is supported as either an extension or an (optional) core feature for | ||
| 385 | // OpenCL version \p CLVer. | ||
| 386 | - bool isSupported(llvm::StringRef Ext, const LangOptions &LO) const { | ||
| 387 | + bool isSupported(llvm::StringRef Ext) const { | ||
| 388 | // In C++ mode all extensions should work at least as in v2.0. | ||
| 389 | - auto CLVer = LO.OpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 390 | auto I = OptMap.find(Ext)->getValue(); | ||
| 391 | return I.Supported && I.Avail <= CLVer; | ||
| 392 | } | ||
| 393 | |||
| 394 | // Is supported (optional) OpenCL core features for OpenCL version \p CLVer. | ||
| 395 | // For supported extension, return false. | ||
| 396 | - bool isSupportedCore(llvm::StringRef Ext, const LangOptions &LO) const { | ||
| 397 | + bool isSupportedCore(llvm::StringRef Ext) const { | ||
| 398 | // In C++ mode all extensions should work at least as in v2.0. | ||
| 399 | - auto CLVer = LO.OpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 400 | auto I = OptMap.find(Ext)->getValue(); | ||
| 401 | return I.Supported && I.Avail <= CLVer && I.Core != ~0U && CLVer >= I.Core; | ||
| 402 | } | ||
| 403 | |||
| 404 | // Is supported OpenCL extension for OpenCL version \p CLVer. | ||
| 405 | // For supported (optional) core feature, return false. | ||
| 406 | - bool isSupportedExtension(llvm::StringRef Ext, const LangOptions &LO) const { | ||
| 407 | + bool isSupportedExtension(llvm::StringRef Ext) const { | ||
| 408 | // In C++ mode all extensions should work at least as in v2.0. | ||
| 409 | - auto CLVer = LO.OpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 410 | auto I = OptMap.find(Ext)->getValue(); | ||
| 411 | return I.Supported && I.Avail <= CLVer && (I.Core == ~0U || CLVer < I.Core); | ||
| 412 | } | ||
| 413 | |||
| 414 | + // Support features whose support is directly related to the | ||
| 415 | + // specific OpenCL version. For example, OpenCL 2.0 supports | ||
| 416 | + // all features that are optional in 3.0 | ||
| 417 | + void adjustFeatures() { | ||
| 418 | + // Support int64 by default (assume compiling for FULL profile) | ||
| 419 | + OptMap["__opencl_c_int64"].Supported = true; | ||
| 420 | + | ||
| 421 | + if (CLVer >= 300) { | ||
| 422 | + // Simultaneously support extension and corresponding feature | ||
| 423 | + for (llvm::StringRef F : | ||
| 424 | + {"__opencl_c_subgroups", "__opencl_c_3d_image_writes", | ||
| 425 | + "__opencl_c_fp64"}) { | ||
| 426 | + auto Ext = getEquivalentExtension(F); | ||
| 427 | + OptMap[*Ext].Supported = OptMap[F].Supported; | ||
| 428 | + } | ||
| 429 | + | ||
| 430 | + // OpenCL C compilers that define the feature macro __opencl_c_pipes or | ||
| 431 | + // or __opencl_c_device_enqueue must also define the | ||
| 432 | + // feature macro __opencl_c_generic_address_space. | ||
| 433 | + if (OptMap["__opencl_c_pipes"].Supported || | ||
| 434 | + OptMap["__opencl_c_device_enqueue"].Supported) | ||
| 435 | + OptMap["__opencl_c_generic_address_space"].Supported = true; | ||
| 436 | + | ||
| 437 | + // OpenCL C compilers that define the feature macro | ||
| 438 | + // __opencl_c_3d_image_writes or __opencl_c_read_write_images must also | ||
| 439 | + // define the feature macro __opencl_c_images | ||
| 440 | + if (OptMap["__opencl_c_3d_image_writes"].Supported || | ||
| 441 | + OptMap["__opencl_c_read_write_images"].Supported) | ||
| 442 | + OptMap["__opencl_c_images"].Supported = true; | ||
| 443 | + | ||
| 444 | + // All other features are already supported with options | ||
| 445 | + // or in target settings | ||
| 446 | + return; | ||
| 447 | + } | ||
| 448 | + | ||
| 449 | + auto FeaturesRange = llvm::make_filter_range( | ||
| 450 | + OptMap, [&](llvm::StringMapEntry<Info> &OptVal) { | ||
| 451 | + auto Opt = OptVal.getKey(); | ||
| 452 | + return isFeature(Opt); | ||
| 453 | + }); | ||
| 454 | + | ||
| 455 | + for (auto &It : FeaturesRange) { | ||
| 456 | + auto &Info = It.getValue(); | ||
| 457 | + // For OpenCL version less then 3.0 some | ||
| 458 | + // features should be supported simulateneously | ||
| 459 | + // with specific extension | ||
| 460 | + if (Optional<llvm::StringRef> Ext = getEquivalentExtension(It.getKey())) | ||
| 461 | + Info.Supported = Info.Enabled = OptMap[*Ext].Supported; | ||
| 462 | + else if (Info.Avail <= CLVer) | ||
| 463 | + Info.Supported = Info.Enabled = true; | ||
| 464 | + } | ||
| 465 | + } | ||
| 466 | + | ||
| 467 | void enable(llvm::StringRef Ext, bool V = true) { | ||
| 468 | + // Ignore disabling extensions if corresponding features | ||
| 469 | + // already supported for OpenCL version higher then 3.0 | ||
| 470 | + if (CLVer >= 300) | ||
| 471 | + if (Optional<llvm::StringRef> F = getEquivalentFeature(Ext)) | ||
| 472 | + if (V != OptMap[*F].Enabled) | ||
| 473 | + return; | ||
| 474 | OptMap[Ext].Enabled = V; | ||
| 475 | } | ||
| 476 | |||
| 477 | @@ -96,7 +187,7 @@ public: | ||
| 478 | OptMap[Ext].Supported = V; | ||
| 479 | } | ||
| 480 | |||
| 481 | - OpenCLOptions(){ | ||
| 482 | + OpenCLOptions() { | ||
| 483 | #define OPENCLEXT_INTERNAL(Ext, AvailVer, CoreVer) \ | ||
| 484 | OptMap[#Ext].Avail = AvailVer; \ | ||
| 485 | OptMap[#Ext].Core = CoreVer; | ||
| 486 | @@ -104,35 +195,86 @@ public: | ||
| 487 | } | ||
| 488 | |||
| 489 | void addSupport(const OpenCLOptions &Opts) { | ||
| 490 | + assert(IsOpenCLCPlusPlus == Opts.IsOpenCLCPlusPlus && CLVer == Opts.CLVer); | ||
| 491 | for (auto &I:Opts.OptMap) | ||
| 492 | - if (I.second.Supported) | ||
| 493 | + if (I.second.Supported) { | ||
| 494 | OptMap[I.getKey()].Supported = true; | ||
| 495 | + // All features are enabled as they are supported | ||
| 496 | + if (isFeature(I.getKey())) | ||
| 497 | + OptMap[I.getKey()].Enabled = true; | ||
| 498 | + } | ||
| 499 | + if (CLVer >= 300) { | ||
| 500 | + // Enabling extensions with respect to features | ||
| 501 | + for (llvm::StringRef Ext : | ||
| 502 | + {"cl_khr_3d_image_writes", "cl_khr_subgroups", "cl_khr_fp64"}) { | ||
| 503 | + auto Feature = getEquivalentFeature(Ext); | ||
| 504 | + enable(Ext, OptMap[*Feature].Enabled); | ||
| 505 | + } | ||
| 506 | + } | ||
| 507 | } | ||
| 508 | |||
| 509 | void copy(const OpenCLOptions &Opts) { | ||
| 510 | + CLVer = Opts.CLVer; | ||
| 511 | + IsOpenCLCPlusPlus = Opts.IsOpenCLCPlusPlus; | ||
| 512 | OptMap = Opts.OptMap; | ||
| 513 | } | ||
| 514 | |||
| 515 | // Turn on or off support of all options. | ||
| 516 | void supportAll(bool On = true) { | ||
| 517 | - for (llvm::StringMap<Info>::iterator I = OptMap.begin(), | ||
| 518 | - E = OptMap.end(); I != E; ++I) | ||
| 519 | - I->second.Supported = On; | ||
| 520 | + for (llvm::StringMap<Info>::iterator I = OptMap.begin(), E = OptMap.end(); | ||
| 521 | + I != E; ++I) | ||
| 522 | + if (!isFeature(I->getKey())) | ||
| 523 | + I->second.Supported = On; | ||
| 524 | } | ||
| 525 | |||
| 526 | void disableAll() { | ||
| 527 | - for (llvm::StringMap<Info>::iterator I = OptMap.begin(), | ||
| 528 | - E = OptMap.end(); I != E; ++I) | ||
| 529 | - I->second.Enabled = false; | ||
| 530 | + for (llvm::StringMap<Info>::iterator I = OptMap.begin(), E = OptMap.end(); | ||
| 531 | + I != E; ++I) { | ||
| 532 | + auto Ext = I->getKey(); | ||
| 533 | + if (!isFeature(Ext)) | ||
| 534 | + enable(Ext, false); | ||
| 535 | + } | ||
| 536 | } | ||
| 537 | |||
| 538 | - void enableSupportedCore(LangOptions LO) { | ||
| 539 | + void enableSupportedCore() { | ||
| 540 | for (llvm::StringMap<Info>::iterator I = OptMap.begin(), E = OptMap.end(); | ||
| 541 | I != E; ++I) | ||
| 542 | - if (isSupportedCore(I->getKey(), LO)) | ||
| 543 | + if (isSupportedCore(I->getKey())) | ||
| 544 | I->second.Enabled = true; | ||
| 545 | } | ||
| 546 | |||
| 547 | + // This enum specifies how OpenCL versions map into values | ||
| 548 | + // for encoding. This is used when generating built-ins | ||
| 549 | + // from tablegen | ||
| 550 | + enum OpenCLVersionsEncodings : unsigned short { | ||
| 551 | + OPENCL_C_100_CODE = 0x1, | ||
| 552 | + OPENCL_C_110_CODE = 0x2, | ||
| 553 | + OPENCL_C_120_CODE = 0x4, | ||
| 554 | + OPENCL_C_200_CODE = 0x8, | ||
| 555 | + OPENCL_C_300_CODE = 0x10, | ||
| 556 | + OPENCL_C_ALL_CODE = 0x1f | ||
| 557 | + }; | ||
| 558 | + | ||
| 559 | + // Encode version into single integer | ||
| 560 | + static unsigned short EncodeVersion(unsigned OpenCLVersion) { | ||
| 561 | + switch (OpenCLVersion) { | ||
| 562 | + default: | ||
| 563 | + llvm_unreachable("Unknown OpenCL version"); | ||
| 564 | + case 0: | ||
| 565 | + return OpenCLVersionsEncodings::OPENCL_C_ALL_CODE; | ||
| 566 | + case 100: | ||
| 567 | + return OpenCLVersionsEncodings::OPENCL_C_100_CODE; | ||
| 568 | + case 110: | ||
| 569 | + return OpenCLVersionsEncodings::OPENCL_C_110_CODE; | ||
| 570 | + case 120: | ||
| 571 | + return OpenCLVersionsEncodings::OPENCL_C_120_CODE; | ||
| 572 | + case 200: | ||
| 573 | + return OpenCLVersionsEncodings::OPENCL_C_200_CODE; | ||
| 574 | + case 300: | ||
| 575 | + return OpenCLVersionsEncodings::OPENCL_C_300_CODE; | ||
| 576 | + } | ||
| 577 | + } | ||
| 578 | + | ||
| 579 | friend class ASTWriter; | ||
| 580 | friend class ASTReader; | ||
| 581 | }; | ||
| 582 | diff --git a/clang/include/clang/Driver/Options.td b/clang/include/clang/Driver/Options.td | ||
| 583 | index 966cb907b7e2..62536f2470c2 100644 | ||
| 584 | --- a/clang/include/clang/Driver/Options.td | ||
| 585 | +++ b/clang/include/clang/Driver/Options.td | ||
| 586 | @@ -557,7 +557,7 @@ def cl_mad_enable : Flag<["-"], "cl-mad-enable">, Group<opencl_Group>, Flags<[CC | ||
| 587 | def cl_no_signed_zeros : Flag<["-"], "cl-no-signed-zeros">, Group<opencl_Group>, Flags<[CC1Option]>, | ||
| 588 | HelpText<"OpenCL only. Allow use of less precise no signed zeros computations in the generated binary.">; | ||
| 589 | def cl_std_EQ : Joined<["-"], "cl-std=">, Group<opencl_Group>, Flags<[CC1Option]>, | ||
| 590 | - HelpText<"OpenCL language standard to compile for.">, Values<"cl,CL,cl1.1,CL1.1,cl1.2,CL1.2,cl2.0,CL2.0,clc++,CLC++">; | ||
| 591 | + HelpText<"OpenCL language standard to compile for.">, Values<"cl,CL,cl1.1,CL1.1,cl1.2,CL1.2,cl2.0,CL2.0,cl3.0,CL3.0,clc++,CLC++">; | ||
| 592 | def cl_denorms_are_zero : Flag<["-"], "cl-denorms-are-zero">, Group<opencl_Group>, | ||
| 593 | HelpText<"OpenCL only. Allow denormals to be flushed to zero.">; | ||
| 594 | def cl_fp32_correctly_rounded_divide_sqrt : Flag<["-"], "cl-fp32-correctly-rounded-divide-sqrt">, Group<opencl_Group>, Flags<[CC1Option]>, | ||
| 595 | diff --git a/clang/include/clang/Sema/Sema.h b/clang/include/clang/Sema/Sema.h | ||
| 596 | index 16a7084f6b08..5920c27229d8 100644 | ||
| 597 | --- a/clang/include/clang/Sema/Sema.h | ||
| 598 | +++ b/clang/include/clang/Sema/Sema.h | ||
| 599 | @@ -9930,6 +9930,10 @@ public: | ||
| 600 | /// \return true if type is disabled. | ||
| 601 | bool checkOpenCLDisabledDecl(const NamedDecl &D, const Expr &E); | ||
| 602 | |||
| 603 | + bool checkOpenCLSubgroupExtForCallExpr(CallExpr *Call); | ||
| 604 | + | ||
| 605 | + bool isSupportedOpenCLOMemoryOrdering(int64_t Ordering) const; | ||
| 606 | + | ||
| 607 | //===--------------------------------------------------------------------===// | ||
| 608 | // OpenMP directives and clauses. | ||
| 609 | // | ||
| 610 | @@ -11527,6 +11531,11 @@ public: | ||
| 611 | /// that the user intended an assignment used as condition. | ||
| 612 | void DiagnoseEqualityWithExtraParens(ParenExpr *ParenE); | ||
| 613 | |||
| 614 | + template <typename DiagLocT, typename DiagInfoT> | ||
| 615 | + void DiagnoseOpenCLRequiresOption(llvm::StringRef OpenCLOptName, | ||
| 616 | + DiagLocT DiagLoc, DiagInfoT DiagInfo, | ||
| 617 | + unsigned Selector, SourceRange SrcRange); | ||
| 618 | + | ||
| 619 | /// CheckCXXBooleanCondition - Returns true if conversion to bool is invalid. | ||
| 620 | ExprResult CheckCXXBooleanCondition(Expr *CondExpr, bool IsConstexpr = false); | ||
| 621 | |||
| 622 | diff --git a/clang/lib/AST/ASTContext.cpp b/clang/lib/AST/ASTContext.cpp | ||
| 623 | index bf51d35d9693..a54ea8475d7d 100644 | ||
| 624 | --- a/clang/lib/AST/ASTContext.cpp | ||
| 625 | +++ b/clang/lib/AST/ASTContext.cpp | ||
| 626 | @@ -1433,7 +1433,8 @@ void ASTContext::InitBuiltinTypes(const TargetInfo &Target, | ||
| 627 | ObjCSuperType = QualType(); | ||
| 628 | |||
| 629 | // void * type | ||
| 630 | - if (LangOpts.OpenCLVersion >= 200) { | ||
| 631 | + if (Target.getSupportedOpenCLOpts().isEnabled( | ||
| 632 | + "__opencl_c_generic_address_space")) { | ||
| 633 | auto Q = VoidTy.getQualifiers(); | ||
| 634 | Q.setAddressSpace(LangAS::opencl_generic); | ||
| 635 | VoidPtrTy = getPointerType(getCanonicalType( | ||
| 636 | diff --git a/clang/lib/Basic/Builtins.cpp b/clang/lib/Basic/Builtins.cpp | ||
| 637 | index 0cd89df41b67..7a3067345098 100644 | ||
| 638 | --- a/clang/lib/Basic/Builtins.cpp | ||
| 639 | +++ b/clang/lib/Basic/Builtins.cpp | ||
| 640 | @@ -23,6 +23,8 @@ static const Builtin::Info BuiltinInfo[] = { | ||
| 641 | { #ID, TYPE, ATTRS, nullptr, ALL_LANGUAGES, nullptr }, | ||
| 642 | #define LANGBUILTIN(ID, TYPE, ATTRS, LANGS) \ | ||
| 643 | { #ID, TYPE, ATTRS, nullptr, LANGS, nullptr }, | ||
| 644 | +#define OPENCLBUILTIN(ID, TYPE, ATTRS, LANGS, FEATURE) \ | ||
| 645 | + {#ID, TYPE, ATTRS, nullptr, LANGS, FEATURE}, | ||
| 646 | #define LIBBUILTIN(ID, TYPE, ATTRS, HEADER, LANGS) \ | ||
| 647 | { #ID, TYPE, ATTRS, HEADER, LANGS, nullptr }, | ||
| 648 | #include "clang/Basic/Builtins.def" | ||
| 649 | @@ -69,16 +71,17 @@ bool Builtin::Context::builtinIsSupported(const Builtin::Info &BuiltinInfo, | ||
| 650 | bool ObjCUnsupported = !LangOpts.ObjC && BuiltinInfo.Langs == OBJC_LANG; | ||
| 651 | bool OclC1Unsupported = (LangOpts.OpenCLVersion / 100) != 1 && | ||
| 652 | (BuiltinInfo.Langs & ALL_OCLC_LANGUAGES ) == OCLC1X_LANG; | ||
| 653 | - bool OclC2Unsupported = | ||
| 654 | - (LangOpts.OpenCLVersion != 200 && !LangOpts.OpenCLCPlusPlus) && | ||
| 655 | - (BuiltinInfo.Langs & ALL_OCLC_LANGUAGES) == OCLC20_LANG; | ||
| 656 | + bool OclC2PUnsupported = | ||
| 657 | + (BuiltinInfo.Langs & ALL_OCLC_LANGUAGES) == OCLC2P_LANG && | ||
| 658 | + ((LangOpts.OpenCLVersion < 200 && !LangOpts.OpenCLCPlusPlus) || | ||
| 659 | + !OclBuiltinIsSupported(BuiltinInfo, LangOpts)); | ||
| 660 | bool OclCUnsupported = !LangOpts.OpenCL && | ||
| 661 | (BuiltinInfo.Langs & ALL_OCLC_LANGUAGES); | ||
| 662 | bool OpenMPUnsupported = !LangOpts.OpenMP && BuiltinInfo.Langs == OMP_LANG; | ||
| 663 | bool CPlusPlusUnsupported = | ||
| 664 | !LangOpts.CPlusPlus && BuiltinInfo.Langs == CXX_LANG; | ||
| 665 | return !BuiltinsUnsupported && !MathBuiltinsUnsupported && !OclCUnsupported && | ||
| 666 | - !OclC1Unsupported && !OclC2Unsupported && !OpenMPUnsupported && | ||
| 667 | + !OclC1Unsupported && !OclC2PUnsupported && !OpenMPUnsupported && | ||
| 668 | !GnuModeUnsupported && !MSModeUnsupported && !ObjCUnsupported && | ||
| 669 | !CPlusPlusUnsupported; | ||
| 670 | } | ||
| 671 | @@ -191,3 +194,20 @@ bool Builtin::Context::canBeRedeclared(unsigned ID) const { | ||
| 672 | (!hasReferenceArgsOrResult(ID) && | ||
| 673 | !hasCustomTypechecking(ID)); | ||
| 674 | } | ||
| 675 | + | ||
| 676 | +bool Builtin::Context::OclBuiltinIsSupported( | ||
| 677 | + const Builtin::Info &BuiltinInfo, const LangOptions &LangOpts) const { | ||
| 678 | + if (!requiresFeatures(BuiltinInfo)) | ||
| 679 | + return true; | ||
| 680 | + | ||
| 681 | + return llvm::StringSwitch<bool>(BuiltinInfo.Features) | ||
| 682 | + .Case("__opencl_c_device_enqueue", LangOpts.Blocks) | ||
| 683 | + .Case("__opencl_c_generic_address_space", LangOpts.OpenCLGenericKeyword) | ||
| 684 | + .Case("__opencl_c_pipes", LangOpts.OpenCLPipeKeyword) | ||
| 685 | + .Default(false); | ||
| 686 | +} | ||
| 687 | + | ||
| 688 | +bool Builtin::Context::requiresFeatures( | ||
| 689 | + const Builtin::Info &BuiltinInfo) const { | ||
| 690 | + return BuiltinInfo.Features && llvm::StringRef(BuiltinInfo.Features) != ""; | ||
| 691 | +} | ||
| 692 | diff --git a/clang/lib/Basic/TargetInfo.cpp b/clang/lib/Basic/TargetInfo.cpp | ||
| 693 | index eccdc21d724a..6b4f524d5271 100644 | ||
| 694 | --- a/clang/lib/Basic/TargetInfo.cpp | ||
| 695 | +++ b/clang/lib/Basic/TargetInfo.cpp | ||
| 696 | @@ -387,6 +387,17 @@ void TargetInfo::adjust(LangOptions &Opts) { | ||
| 697 | HalfFormat = &llvm::APFloat::IEEEhalf(); | ||
| 698 | FloatFormat = &llvm::APFloat::IEEEsingle(); | ||
| 699 | LongDoubleFormat = &llvm::APFloat::IEEEquad(); | ||
| 700 | + | ||
| 701 | + auto &SupportedOCLOpts = getTargetOpts().SupportedOpenCLOptions; | ||
| 702 | + | ||
| 703 | + SupportedOCLOpts.setOpenCLVersion(Opts); | ||
| 704 | + SupportedOCLOpts.adjustFeatures(); | ||
| 705 | + | ||
| 706 | + if (!Opts.OpenCLCPlusPlus && Opts.OpenCLVersion >= 200) | ||
| 707 | + Opts.Blocks = SupportedOCLOpts.isSupported("__opencl_c_device_enqueue"); | ||
| 708 | + Opts.OpenCLGenericKeyword = | ||
| 709 | + SupportedOCLOpts.isSupported("__opencl_c_generic_address_space"); | ||
| 710 | + Opts.OpenCLPipeKeyword = SupportedOCLOpts.isSupported("__opencl_c_pipes"); | ||
| 711 | } | ||
| 712 | |||
| 713 | if (Opts.DoubleSize) { | ||
| 714 | diff --git a/clang/lib/Basic/Targets.cpp b/clang/lib/Basic/Targets.cpp | ||
| 715 | index 965f273892bd..046d7c15f835 100644 | ||
| 716 | --- a/clang/lib/Basic/Targets.cpp | ||
| 717 | +++ b/clang/lib/Basic/Targets.cpp | ||
| 718 | @@ -40,7 +40,6 @@ | ||
| 719 | #include "clang/Basic/Diagnostic.h" | ||
| 720 | #include "llvm/ADT/StringExtras.h" | ||
| 721 | #include "llvm/ADT/Triple.h" | ||
| 722 | - | ||
| 723 | using namespace clang; | ||
| 724 | |||
| 725 | namespace clang { | ||
| 726 | diff --git a/clang/lib/CodeGen/CodeGenFunction.cpp b/clang/lib/CodeGen/CodeGenFunction.cpp | ||
| 727 | index 8ce488f35dd3..ca4cb0fbf018 100644 | ||
| 728 | --- a/clang/lib/CodeGen/CodeGenFunction.cpp | ||
| 729 | +++ b/clang/lib/CodeGen/CodeGenFunction.cpp | ||
| 730 | @@ -2306,11 +2306,11 @@ void CodeGenFunction::checkTargetFeatures(SourceLocation Loc, | ||
| 731 | std::string MissingFeature; | ||
| 732 | if (BuiltinID) { | ||
| 733 | SmallVector<StringRef, 1> ReqFeatures; | ||
| 734 | - const char *FeatureList = | ||
| 735 | - CGM.getContext().BuiltinInfo.getRequiredFeatures(BuiltinID); | ||
| 736 | // Return if the builtin doesn't have any required features. | ||
| 737 | - if (!FeatureList || StringRef(FeatureList) == "") | ||
| 738 | + if (!CGM.getContext().BuiltinInfo.requiresFeatures(BuiltinID)) | ||
| 739 | return; | ||
| 740 | + const char *FeatureList = | ||
| 741 | + CGM.getContext().BuiltinInfo.getRequiredFeatures(BuiltinID); | ||
| 742 | StringRef(FeatureList).split(ReqFeatures, ','); | ||
| 743 | if (!hasRequiredFeatures(ReqFeatures, CGM, FD, MissingFeature)) | ||
| 744 | CGM.getDiags().Report(Loc, diag::err_builtin_needs_feature) | ||
| 745 | diff --git a/clang/lib/Frontend/CompilerInvocation.cpp b/clang/lib/Frontend/CompilerInvocation.cpp | ||
| 746 | index 73114c6d76cb..bc54d231b97a 100644 | ||
| 747 | --- a/clang/lib/Frontend/CompilerInvocation.cpp | ||
| 748 | +++ b/clang/lib/Frontend/CompilerInvocation.cpp | ||
| 749 | @@ -2344,6 +2344,8 @@ void CompilerInvocation::setLangDefaults(LangOptions &Opts, InputKind IK, | ||
| 750 | Opts.OpenCLVersion = 120; | ||
| 751 | else if (LangStd == LangStandard::lang_opencl20) | ||
| 752 | Opts.OpenCLVersion = 200; | ||
| 753 | + else if (LangStd == LangStandard::lang_opencl30) | ||
| 754 | + Opts.OpenCLVersion = 300; | ||
| 755 | else if (LangStd == LangStandard::lang_openclcpp) | ||
| 756 | Opts.OpenCLCPlusPlusVersion = 100; | ||
| 757 | |||
| 758 | @@ -2544,14 +2546,15 @@ static void ParseLangArgs(LangOptions &Opts, ArgList &Args, InputKind IK, | ||
| 759 | // -cl-std only applies for OpenCL language standards. | ||
| 760 | // Override the -std option in this case. | ||
| 761 | if (const Arg *A = Args.getLastArg(OPT_cl_std_EQ)) { | ||
| 762 | - LangStandard::Kind OpenCLLangStd | ||
| 763 | - = llvm::StringSwitch<LangStandard::Kind>(A->getValue()) | ||
| 764 | - .Cases("cl", "CL", LangStandard::lang_opencl10) | ||
| 765 | - .Cases("cl1.1", "CL1.1", LangStandard::lang_opencl11) | ||
| 766 | - .Cases("cl1.2", "CL1.2", LangStandard::lang_opencl12) | ||
| 767 | - .Cases("cl2.0", "CL2.0", LangStandard::lang_opencl20) | ||
| 768 | - .Cases("clc++", "CLC++", LangStandard::lang_openclcpp) | ||
| 769 | - .Default(LangStandard::lang_unspecified); | ||
| 770 | + LangStandard::Kind OpenCLLangStd = | ||
| 771 | + llvm::StringSwitch<LangStandard::Kind>(A->getValue()) | ||
| 772 | + .Cases("cl", "CL", LangStandard::lang_opencl10) | ||
| 773 | + .Cases("cl1.1", "CL1.1", LangStandard::lang_opencl11) | ||
| 774 | + .Cases("cl1.2", "CL1.2", LangStandard::lang_opencl12) | ||
| 775 | + .Cases("cl2.0", "CL2.0", LangStandard::lang_opencl20) | ||
| 776 | + .Cases("cl3.0", "CL3.0", LangStandard::lang_opencl30) | ||
| 777 | + .Cases("clc++", "CLC++", LangStandard::lang_openclcpp) | ||
| 778 | + .Default(LangStandard::lang_unspecified); | ||
| 779 | |||
| 780 | if (OpenCLLangStd == LangStandard::lang_unspecified) { | ||
| 781 | Diags.Report(diag::err_drv_invalid_value) | ||
| 782 | @@ -2852,8 +2855,7 @@ static void ParseLangArgs(LangOptions &Opts, ArgList &Args, InputKind IK, | ||
| 783 | |||
| 784 | Opts.RTTI = Opts.CPlusPlus && !Args.hasArg(OPT_fno_rtti); | ||
| 785 | Opts.RTTIData = Opts.RTTI && !Args.hasArg(OPT_fno_rtti_data); | ||
| 786 | - Opts.Blocks = Args.hasArg(OPT_fblocks) || (Opts.OpenCL | ||
| 787 | - && Opts.OpenCLVersion == 200); | ||
| 788 | + Opts.Blocks = Args.hasArg(OPT_fblocks); | ||
| 789 | Opts.BlocksRuntimeOptional = Args.hasArg(OPT_fblocks_runtime_optional); | ||
| 790 | Opts.Coroutines = Opts.CPlusPlus20 || Args.hasArg(OPT_fcoroutines_ts); | ||
| 791 | |||
| 792 | diff --git a/clang/lib/Frontend/InitPreprocessor.cpp b/clang/lib/Frontend/InitPreprocessor.cpp | ||
| 793 | index 6eef1e2376f6..5bb489c11909 100644 | ||
| 794 | --- a/clang/lib/Frontend/InitPreprocessor.cpp | ||
| 795 | +++ b/clang/lib/Frontend/InitPreprocessor.cpp | ||
| 796 | @@ -445,6 +445,9 @@ static void InitializeStandardPredefinedMacros(const TargetInfo &TI, | ||
| 797 | case 200: | ||
| 798 | Builder.defineMacro("__OPENCL_C_VERSION__", "200"); | ||
| 799 | break; | ||
| 800 | + case 300: | ||
| 801 | + Builder.defineMacro("__OPENCL_C_VERSION__", "300"); | ||
| 802 | + break; | ||
| 803 | default: | ||
| 804 | llvm_unreachable("Unsupported OpenCL version"); | ||
| 805 | } | ||
| 806 | @@ -453,6 +456,7 @@ static void InitializeStandardPredefinedMacros(const TargetInfo &TI, | ||
| 807 | Builder.defineMacro("CL_VERSION_1_1", "110"); | ||
| 808 | Builder.defineMacro("CL_VERSION_1_2", "120"); | ||
| 809 | Builder.defineMacro("CL_VERSION_2_0", "200"); | ||
| 810 | + Builder.defineMacro("CL_VERSION_3_0", "300"); | ||
| 811 | |||
| 812 | if (TI.isLittleEndian()) | ||
| 813 | Builder.defineMacro("__ENDIAN_LITTLE__"); | ||
| 814 | @@ -1108,7 +1112,7 @@ static void InitializePredefinedMacros(const TargetInfo &TI, | ||
| 815 | // OpenCL definitions. | ||
| 816 | if (LangOpts.OpenCL) { | ||
| 817 | #define OPENCLEXT(Ext) \ | ||
| 818 | - if (TI.getSupportedOpenCLOpts().isSupported(#Ext, LangOpts)) \ | ||
| 819 | + if (TI.getSupportedOpenCLOpts().isSupported(#Ext)) \ | ||
| 820 | Builder.defineMacro(#Ext); | ||
| 821 | #include "clang/Basic/OpenCLExtensions.def" | ||
| 822 | |||
| 823 | diff --git a/clang/lib/Headers/opencl-c-base.h b/clang/lib/Headers/opencl-c-base.h | ||
| 824 | index 430e07d36f62..afa900ab24d9 100644 | ||
| 825 | --- a/clang/lib/Headers/opencl-c-base.h | ||
| 826 | +++ b/clang/lib/Headers/opencl-c-base.h | ||
| 827 | @@ -9,6 +9,59 @@ | ||
| 828 | #ifndef _OPENCL_BASE_H_ | ||
| 829 | #define _OPENCL_BASE_H_ | ||
| 830 | |||
| 831 | +// Add predefined macros to build headers with standalone executable | ||
| 832 | +#ifndef CL_VERSION_3_0 | ||
| 833 | + #define CL_VERSION_3_0 300 | ||
| 834 | +#endif | ||
| 835 | + | ||
| 836 | +// Define features for 2.0 for header backward compatibility | ||
| 837 | +#ifndef __opencl_c_int64 | ||
| 838 | + #define __opencl_c_int64 1 | ||
| 839 | +#endif | ||
| 840 | +#if __OPENCL_C_VERSION__ != CL_VERSION_3_0 | ||
| 841 | + #ifndef __opencl_c_images | ||
| 842 | + #define __opencl_c_images 1 | ||
| 843 | + #endif | ||
| 844 | +#endif | ||
| 845 | +#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 846 | +#ifndef __opencl_c_pipes | ||
| 847 | + #define __opencl_c_pipes 1 | ||
| 848 | +#endif | ||
| 849 | +#ifndef __opencl_c_generic_address_space | ||
| 850 | + #define __opencl_c_generic_address_space 1 | ||
| 851 | +#endif | ||
| 852 | +#ifndef __opencl_c_work_group_collective_functions | ||
| 853 | + #define __opencl_c_work_group_collective_functions 1 | ||
| 854 | +#endif | ||
| 855 | +#ifndef __opencl_c_atomic_order_acq_rel | ||
| 856 | + #define __opencl_c_atomic_order_acq_rel 1 | ||
| 857 | +#endif | ||
| 858 | +#ifndef __opencl_c_atomic_order_seq_cst | ||
| 859 | + #define __opencl_c_atomic_order_seq_cst 1 | ||
| 860 | +#endif | ||
| 861 | +#ifndef __opencl_c_atomic_scope_device | ||
| 862 | + #define __opencl_c_atomic_scope_device 1 | ||
| 863 | +#endif | ||
| 864 | +#ifndef __opencl_c_atomic_scope_all_devices | ||
| 865 | + #define __opencl_c_atomic_scope_all_devices 1 | ||
| 866 | +#endif | ||
| 867 | +#ifndef __opencl_c_subgroups | ||
| 868 | + #define __opencl_c_subgroups 1 | ||
| 869 | +#endif | ||
| 870 | +#ifndef __opencl_c_3d_image_writes | ||
| 871 | + #define __opencl_c_3d_image_writes 1 | ||
| 872 | +#endif | ||
| 873 | +#ifndef __opencl_c_device_enqueue | ||
| 874 | + #define __opencl_c_device_enqueue 1 | ||
| 875 | +#endif | ||
| 876 | +#ifndef __opencl_c_read_write_images | ||
| 877 | + #define __opencl_c_read_write_images 1 | ||
| 878 | +#endif | ||
| 879 | +#ifndef __opencl_c_program_scope_global_variables | ||
| 880 | + #define __opencl_c_program_scope_global_variables 1 | ||
| 881 | +#endif | ||
| 882 | +#endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 883 | + | ||
| 884 | // built-in scalar data types: | ||
| 885 | |||
| 886 | /** | ||
| 887 | @@ -115,7 +168,12 @@ typedef half half4 __attribute__((ext_vector_type(4))); | ||
| 888 | typedef half half8 __attribute__((ext_vector_type(8))); | ||
| 889 | typedef half half16 __attribute__((ext_vector_type(16))); | ||
| 890 | #endif | ||
| 891 | -#ifdef cl_khr_fp64 | ||
| 892 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 893 | + | ||
| 894 | +#ifndef __opencl_c_fp64 | ||
| 895 | + #define __opencl_c_fp64 1 | ||
| 896 | +#endif | ||
| 897 | + | ||
| 898 | #if __OPENCL_C_VERSION__ < CL_VERSION_1_2 | ||
| 899 | #pragma OPENCL EXTENSION cl_khr_fp64 : enable | ||
| 900 | #endif | ||
| 901 | @@ -281,9 +339,17 @@ typedef uint cl_mem_fence_flags; | ||
| 902 | typedef enum memory_scope { | ||
| 903 | memory_scope_work_item = __OPENCL_MEMORY_SCOPE_WORK_ITEM, | ||
| 904 | memory_scope_work_group = __OPENCL_MEMORY_SCOPE_WORK_GROUP, | ||
| 905 | +#ifdef __opencl_c_atomic_scope_device | ||
| 906 | memory_scope_device = __OPENCL_MEMORY_SCOPE_DEVICE, | ||
| 907 | +#endif | ||
| 908 | +#ifdef __opencl_c_atomic_scope_all_devices | ||
| 909 | + #if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 910 | + memory_scope_all_devices = __OPENCL_MEMORY_SCOPE_ALL_SVM_DEVICES, | ||
| 911 | + #endif //(__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 912 | memory_scope_all_svm_devices = __OPENCL_MEMORY_SCOPE_ALL_SVM_DEVICES, | ||
| 913 | -#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups) | ||
| 914 | +#endif // __opencl_c_atomic_scope_all_devices | ||
| 915 | +#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups) || \ | ||
| 916 | + defined(__opencl_c_subgroups) | ||
| 917 | memory_scope_sub_group = __OPENCL_MEMORY_SCOPE_SUB_GROUP | ||
| 918 | #endif | ||
| 919 | } memory_scope; | ||
| 920 | @@ -301,13 +367,14 @@ typedef enum memory_scope { | ||
| 921 | #define ATOMIC_FLAG_INIT 0 | ||
| 922 | |||
| 923 | // enum values aligned with what clang uses in EmitAtomicExpr() | ||
| 924 | -typedef enum memory_order | ||
| 925 | -{ | ||
| 926 | +typedef enum memory_order { | ||
| 927 | memory_order_relaxed = __ATOMIC_RELAXED, | ||
| 928 | memory_order_acquire = __ATOMIC_ACQUIRE, | ||
| 929 | memory_order_release = __ATOMIC_RELEASE, | ||
| 930 | memory_order_acq_rel = __ATOMIC_ACQ_REL, | ||
| 931 | +#ifdef __opencl_c_atomic_order_seq_cst | ||
| 932 | memory_order_seq_cst = __ATOMIC_SEQ_CST | ||
| 933 | +#endif //__opencl_c_atomic_order_seq_cst | ||
| 934 | } memory_order; | ||
| 935 | |||
| 936 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 937 | diff --git a/clang/lib/Headers/opencl-c.h b/clang/lib/Headers/opencl-c.h | ||
| 938 | index 66e18bdd47bb..67d900eb1c3d 100644 | ||
| 939 | --- a/clang/lib/Headers/opencl-c.h | ||
| 940 | +++ b/clang/lib/Headers/opencl-c.h | ||
| 941 | @@ -35,7 +35,6 @@ | ||
| 942 | #define __purefn __attribute__((pure)) | ||
| 943 | #define __cnfn __attribute__((const)) | ||
| 944 | |||
| 945 | - | ||
| 946 | // OpenCL v1.1/1.2/2.0 s6.2.3 - Explicit conversions | ||
| 947 | |||
| 948 | char __ovld __cnfn convert_char_rte(char); | ||
| 949 | @@ -4632,7 +4631,7 @@ float16 __ovld __cnfn convert_float16(float16); | ||
| 950 | |||
| 951 | // Conversions with double data type parameters or return value. | ||
| 952 | |||
| 953 | -#ifdef cl_khr_fp64 | ||
| 954 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 955 | char __ovld __cnfn convert_char(double); | ||
| 956 | char __ovld __cnfn convert_char_rte(double); | ||
| 957 | char __ovld __cnfn convert_char_rtn(double); | ||
| 958 | @@ -5452,7 +5451,7 @@ double16 __ovld __cnfn convert_double16_rtz(uchar16); | ||
| 959 | double16 __ovld __cnfn convert_double16_rtz(uint16); | ||
| 960 | double16 __ovld __cnfn convert_double16_rtz(ulong16); | ||
| 961 | double16 __ovld __cnfn convert_double16_rtz(ushort16); | ||
| 962 | -#endif //cl_khr_fp64 | ||
| 963 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 964 | |||
| 965 | #ifdef cl_khr_fp16 | ||
| 966 | // Convert half types to non-double types. | ||
| 967 | @@ -6270,7 +6269,7 @@ half16 __ovld __cnfn convert_half16_rtz(float16); | ||
| 968 | half16 __ovld __cnfn convert_half16_rtz(half16); | ||
| 969 | |||
| 970 | // Convert half types to double types. | ||
| 971 | -#ifdef cl_khr_fp64 | ||
| 972 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 973 | double __ovld __cnfn convert_double(half); | ||
| 974 | double __ovld __cnfn convert_double_rte(half); | ||
| 975 | double __ovld __cnfn convert_double_rtp(half); | ||
| 976 | @@ -6333,7 +6332,7 @@ half16 __ovld __cnfn convert_half16_rte(double16); | ||
| 977 | half16 __ovld __cnfn convert_half16_rtp(double16); | ||
| 978 | half16 __ovld __cnfn convert_half16_rtn(double16); | ||
| 979 | half16 __ovld __cnfn convert_half16_rtz(double16); | ||
| 980 | -#endif //cl_khr_fp64 | ||
| 981 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 982 | |||
| 983 | #endif // cl_khr_fp16 | ||
| 984 | |||
| 985 | @@ -6404,14 +6403,14 @@ half16 __ovld __cnfn convert_half16_rtz(double16); | ||
| 986 | #define as_float8(x) __builtin_astype((x), float8) | ||
| 987 | #define as_float16(x) __builtin_astype((x), float16) | ||
| 988 | |||
| 989 | -#ifdef cl_khr_fp64 | ||
| 990 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 991 | #define as_double(x) __builtin_astype((x), double) | ||
| 992 | #define as_double2(x) __builtin_astype((x), double2) | ||
| 993 | #define as_double3(x) __builtin_astype((x), double3) | ||
| 994 | #define as_double4(x) __builtin_astype((x), double4) | ||
| 995 | #define as_double8(x) __builtin_astype((x), double8) | ||
| 996 | #define as_double16(x) __builtin_astype((x), double16) | ||
| 997 | -#endif //cl_khr_fp64 | ||
| 998 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 999 | |||
| 1000 | #ifdef cl_khr_fp16 | ||
| 1001 | #define as_half(x) __builtin_astype((x), half) | ||
| 1002 | @@ -6534,14 +6533,14 @@ float3 __ovld __cnfn acos(float3); | ||
| 1003 | float4 __ovld __cnfn acos(float4); | ||
| 1004 | float8 __ovld __cnfn acos(float8); | ||
| 1005 | float16 __ovld __cnfn acos(float16); | ||
| 1006 | -#ifdef cl_khr_fp64 | ||
| 1007 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1008 | double __ovld __cnfn acos(double); | ||
| 1009 | double2 __ovld __cnfn acos(double2); | ||
| 1010 | double3 __ovld __cnfn acos(double3); | ||
| 1011 | double4 __ovld __cnfn acos(double4); | ||
| 1012 | double8 __ovld __cnfn acos(double8); | ||
| 1013 | double16 __ovld __cnfn acos(double16); | ||
| 1014 | -#endif //cl_khr_fp64 | ||
| 1015 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1016 | #ifdef cl_khr_fp16 | ||
| 1017 | half __ovld __cnfn acos(half); | ||
| 1018 | half2 __ovld __cnfn acos(half2); | ||
| 1019 | @@ -6560,14 +6559,14 @@ float3 __ovld __cnfn acosh(float3); | ||
| 1020 | float4 __ovld __cnfn acosh(float4); | ||
| 1021 | float8 __ovld __cnfn acosh(float8); | ||
| 1022 | float16 __ovld __cnfn acosh(float16); | ||
| 1023 | -#ifdef cl_khr_fp64 | ||
| 1024 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1025 | double __ovld __cnfn acosh(double); | ||
| 1026 | double2 __ovld __cnfn acosh(double2); | ||
| 1027 | double3 __ovld __cnfn acosh(double3); | ||
| 1028 | double4 __ovld __cnfn acosh(double4); | ||
| 1029 | double8 __ovld __cnfn acosh(double8); | ||
| 1030 | double16 __ovld __cnfn acosh(double16); | ||
| 1031 | -#endif //cl_khr_fp64 | ||
| 1032 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1033 | #ifdef cl_khr_fp16 | ||
| 1034 | half __ovld __cnfn acosh(half); | ||
| 1035 | half2 __ovld __cnfn acosh(half2); | ||
| 1036 | @@ -6586,14 +6585,14 @@ float3 __ovld __cnfn acospi(float3 x); | ||
| 1037 | float4 __ovld __cnfn acospi(float4 x); | ||
| 1038 | float8 __ovld __cnfn acospi(float8 x); | ||
| 1039 | float16 __ovld __cnfn acospi(float16 x); | ||
| 1040 | -#ifdef cl_khr_fp64 | ||
| 1041 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1042 | double __ovld __cnfn acospi(double x); | ||
| 1043 | double2 __ovld __cnfn acospi(double2 x); | ||
| 1044 | double3 __ovld __cnfn acospi(double3 x); | ||
| 1045 | double4 __ovld __cnfn acospi(double4 x); | ||
| 1046 | double8 __ovld __cnfn acospi(double8 x); | ||
| 1047 | double16 __ovld __cnfn acospi(double16 x); | ||
| 1048 | -#endif //cl_khr_fp64 | ||
| 1049 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1050 | #ifdef cl_khr_fp16 | ||
| 1051 | half __ovld __cnfn acospi(half x); | ||
| 1052 | half2 __ovld __cnfn acospi(half2 x); | ||
| 1053 | @@ -6612,14 +6611,14 @@ float3 __ovld __cnfn asin(float3); | ||
| 1054 | float4 __ovld __cnfn asin(float4); | ||
| 1055 | float8 __ovld __cnfn asin(float8); | ||
| 1056 | float16 __ovld __cnfn asin(float16); | ||
| 1057 | -#ifdef cl_khr_fp64 | ||
| 1058 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1059 | double __ovld __cnfn asin(double); | ||
| 1060 | double2 __ovld __cnfn asin(double2); | ||
| 1061 | double3 __ovld __cnfn asin(double3); | ||
| 1062 | double4 __ovld __cnfn asin(double4); | ||
| 1063 | double8 __ovld __cnfn asin(double8); | ||
| 1064 | double16 __ovld __cnfn asin(double16); | ||
| 1065 | -#endif //cl_khr_fp64 | ||
| 1066 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1067 | #ifdef cl_khr_fp16 | ||
| 1068 | half __ovld __cnfn asin(half); | ||
| 1069 | half2 __ovld __cnfn asin(half2); | ||
| 1070 | @@ -6638,14 +6637,14 @@ float3 __ovld __cnfn asinh(float3); | ||
| 1071 | float4 __ovld __cnfn asinh(float4); | ||
| 1072 | float8 __ovld __cnfn asinh(float8); | ||
| 1073 | float16 __ovld __cnfn asinh(float16); | ||
| 1074 | -#ifdef cl_khr_fp64 | ||
| 1075 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1076 | double __ovld __cnfn asinh(double); | ||
| 1077 | double2 __ovld __cnfn asinh(double2); | ||
| 1078 | double3 __ovld __cnfn asinh(double3); | ||
| 1079 | double4 __ovld __cnfn asinh(double4); | ||
| 1080 | double8 __ovld __cnfn asinh(double8); | ||
| 1081 | double16 __ovld __cnfn asinh(double16); | ||
| 1082 | -#endif //cl_khr_fp64 | ||
| 1083 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1084 | #ifdef cl_khr_fp16 | ||
| 1085 | half __ovld __cnfn asinh(half); | ||
| 1086 | half2 __ovld __cnfn asinh(half2); | ||
| 1087 | @@ -6664,14 +6663,14 @@ float3 __ovld __cnfn asinpi(float3 x); | ||
| 1088 | float4 __ovld __cnfn asinpi(float4 x); | ||
| 1089 | float8 __ovld __cnfn asinpi(float8 x); | ||
| 1090 | float16 __ovld __cnfn asinpi(float16 x); | ||
| 1091 | -#ifdef cl_khr_fp64 | ||
| 1092 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1093 | double __ovld __cnfn asinpi(double x); | ||
| 1094 | double2 __ovld __cnfn asinpi(double2 x); | ||
| 1095 | double3 __ovld __cnfn asinpi(double3 x); | ||
| 1096 | double4 __ovld __cnfn asinpi(double4 x); | ||
| 1097 | double8 __ovld __cnfn asinpi(double8 x); | ||
| 1098 | double16 __ovld __cnfn asinpi(double16 x); | ||
| 1099 | -#endif //cl_khr_fp64 | ||
| 1100 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1101 | #ifdef cl_khr_fp16 | ||
| 1102 | half __ovld __cnfn asinpi(half x); | ||
| 1103 | half2 __ovld __cnfn asinpi(half2 x); | ||
| 1104 | @@ -6690,14 +6689,14 @@ float3 __ovld __cnfn atan(float3 y_over_x); | ||
| 1105 | float4 __ovld __cnfn atan(float4 y_over_x); | ||
| 1106 | float8 __ovld __cnfn atan(float8 y_over_x); | ||
| 1107 | float16 __ovld __cnfn atan(float16 y_over_x); | ||
| 1108 | -#ifdef cl_khr_fp64 | ||
| 1109 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1110 | double __ovld __cnfn atan(double y_over_x); | ||
| 1111 | double2 __ovld __cnfn atan(double2 y_over_x); | ||
| 1112 | double3 __ovld __cnfn atan(double3 y_over_x); | ||
| 1113 | double4 __ovld __cnfn atan(double4 y_over_x); | ||
| 1114 | double8 __ovld __cnfn atan(double8 y_over_x); | ||
| 1115 | double16 __ovld __cnfn atan(double16 y_over_x); | ||
| 1116 | -#endif //cl_khr_fp64 | ||
| 1117 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1118 | #ifdef cl_khr_fp16 | ||
| 1119 | half __ovld __cnfn atan(half y_over_x); | ||
| 1120 | half2 __ovld __cnfn atan(half2 y_over_x); | ||
| 1121 | @@ -6716,14 +6715,14 @@ float3 __ovld __cnfn atan2(float3 y, float3 x); | ||
| 1122 | float4 __ovld __cnfn atan2(float4 y, float4 x); | ||
| 1123 | float8 __ovld __cnfn atan2(float8 y, float8 x); | ||
| 1124 | float16 __ovld __cnfn atan2(float16 y, float16 x); | ||
| 1125 | -#ifdef cl_khr_fp64 | ||
| 1126 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1127 | double __ovld __cnfn atan2(double y, double x); | ||
| 1128 | double2 __ovld __cnfn atan2(double2 y, double2 x); | ||
| 1129 | double3 __ovld __cnfn atan2(double3 y, double3 x); | ||
| 1130 | double4 __ovld __cnfn atan2(double4 y, double4 x); | ||
| 1131 | double8 __ovld __cnfn atan2(double8 y, double8 x); | ||
| 1132 | double16 __ovld __cnfn atan2(double16 y, double16 x); | ||
| 1133 | -#endif //cl_khr_fp64 | ||
| 1134 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1135 | #ifdef cl_khr_fp16 | ||
| 1136 | half __ovld __cnfn atan2(half y, half x); | ||
| 1137 | half2 __ovld __cnfn atan2(half2 y, half2 x); | ||
| 1138 | @@ -6742,14 +6741,14 @@ float3 __ovld __cnfn atanh(float3); | ||
| 1139 | float4 __ovld __cnfn atanh(float4); | ||
| 1140 | float8 __ovld __cnfn atanh(float8); | ||
| 1141 | float16 __ovld __cnfn atanh(float16); | ||
| 1142 | -#ifdef cl_khr_fp64 | ||
| 1143 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1144 | double __ovld __cnfn atanh(double); | ||
| 1145 | double2 __ovld __cnfn atanh(double2); | ||
| 1146 | double3 __ovld __cnfn atanh(double3); | ||
| 1147 | double4 __ovld __cnfn atanh(double4); | ||
| 1148 | double8 __ovld __cnfn atanh(double8); | ||
| 1149 | double16 __ovld __cnfn atanh(double16); | ||
| 1150 | -#endif //cl_khr_fp64 | ||
| 1151 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1152 | #ifdef cl_khr_fp16 | ||
| 1153 | half __ovld __cnfn atanh(half); | ||
| 1154 | half2 __ovld __cnfn atanh(half2); | ||
| 1155 | @@ -6768,14 +6767,14 @@ float3 __ovld __cnfn atanpi(float3 x); | ||
| 1156 | float4 __ovld __cnfn atanpi(float4 x); | ||
| 1157 | float8 __ovld __cnfn atanpi(float8 x); | ||
| 1158 | float16 __ovld __cnfn atanpi(float16 x); | ||
| 1159 | -#ifdef cl_khr_fp64 | ||
| 1160 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1161 | double __ovld __cnfn atanpi(double x); | ||
| 1162 | double2 __ovld __cnfn atanpi(double2 x); | ||
| 1163 | double3 __ovld __cnfn atanpi(double3 x); | ||
| 1164 | double4 __ovld __cnfn atanpi(double4 x); | ||
| 1165 | double8 __ovld __cnfn atanpi(double8 x); | ||
| 1166 | double16 __ovld __cnfn atanpi(double16 x); | ||
| 1167 | -#endif //cl_khr_fp64 | ||
| 1168 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1169 | #ifdef cl_khr_fp16 | ||
| 1170 | half __ovld __cnfn atanpi(half x); | ||
| 1171 | half2 __ovld __cnfn atanpi(half2 x); | ||
| 1172 | @@ -6794,14 +6793,14 @@ float3 __ovld __cnfn atan2pi(float3 y, float3 x); | ||
| 1173 | float4 __ovld __cnfn atan2pi(float4 y, float4 x); | ||
| 1174 | float8 __ovld __cnfn atan2pi(float8 y, float8 x); | ||
| 1175 | float16 __ovld __cnfn atan2pi(float16 y, float16 x); | ||
| 1176 | -#ifdef cl_khr_fp64 | ||
| 1177 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1178 | double __ovld __cnfn atan2pi(double y, double x); | ||
| 1179 | double2 __ovld __cnfn atan2pi(double2 y, double2 x); | ||
| 1180 | double3 __ovld __cnfn atan2pi(double3 y, double3 x); | ||
| 1181 | double4 __ovld __cnfn atan2pi(double4 y, double4 x); | ||
| 1182 | double8 __ovld __cnfn atan2pi(double8 y, double8 x); | ||
| 1183 | double16 __ovld __cnfn atan2pi(double16 y, double16 x); | ||
| 1184 | -#endif //cl_khr_fp64 | ||
| 1185 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1186 | #ifdef cl_khr_fp16 | ||
| 1187 | half __ovld __cnfn atan2pi(half y, half x); | ||
| 1188 | half2 __ovld __cnfn atan2pi(half2 y, half2 x); | ||
| 1189 | @@ -6820,14 +6819,14 @@ float3 __ovld __cnfn cbrt(float3); | ||
| 1190 | float4 __ovld __cnfn cbrt(float4); | ||
| 1191 | float8 __ovld __cnfn cbrt(float8); | ||
| 1192 | float16 __ovld __cnfn cbrt(float16); | ||
| 1193 | -#ifdef cl_khr_fp64 | ||
| 1194 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1195 | double __ovld __cnfn cbrt(double); | ||
| 1196 | double2 __ovld __cnfn cbrt(double2); | ||
| 1197 | double3 __ovld __cnfn cbrt(double3); | ||
| 1198 | double4 __ovld __cnfn cbrt(double4); | ||
| 1199 | double8 __ovld __cnfn cbrt(double8); | ||
| 1200 | double16 __ovld __cnfn cbrt(double16); | ||
| 1201 | -#endif //cl_khr_fp64 | ||
| 1202 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1203 | #ifdef cl_khr_fp16 | ||
| 1204 | half __ovld __cnfn cbrt(half); | ||
| 1205 | half2 __ovld __cnfn cbrt(half2); | ||
| 1206 | @@ -6847,14 +6846,14 @@ float3 __ovld __cnfn ceil(float3); | ||
| 1207 | float4 __ovld __cnfn ceil(float4); | ||
| 1208 | float8 __ovld __cnfn ceil(float8); | ||
| 1209 | float16 __ovld __cnfn ceil(float16); | ||
| 1210 | -#ifdef cl_khr_fp64 | ||
| 1211 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1212 | double __ovld __cnfn ceil(double); | ||
| 1213 | double2 __ovld __cnfn ceil(double2); | ||
| 1214 | double3 __ovld __cnfn ceil(double3); | ||
| 1215 | double4 __ovld __cnfn ceil(double4); | ||
| 1216 | double8 __ovld __cnfn ceil(double8); | ||
| 1217 | double16 __ovld __cnfn ceil(double16); | ||
| 1218 | -#endif //cl_khr_fp64 | ||
| 1219 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1220 | #ifdef cl_khr_fp16 | ||
| 1221 | half __ovld __cnfn ceil(half); | ||
| 1222 | half2 __ovld __cnfn ceil(half2); | ||
| 1223 | @@ -6873,14 +6872,14 @@ float3 __ovld __cnfn copysign(float3 x, float3 y); | ||
| 1224 | float4 __ovld __cnfn copysign(float4 x, float4 y); | ||
| 1225 | float8 __ovld __cnfn copysign(float8 x, float8 y); | ||
| 1226 | float16 __ovld __cnfn copysign(float16 x, float16 y); | ||
| 1227 | -#ifdef cl_khr_fp64 | ||
| 1228 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1229 | double __ovld __cnfn copysign(double x, double y); | ||
| 1230 | double2 __ovld __cnfn copysign(double2 x, double2 y); | ||
| 1231 | double3 __ovld __cnfn copysign(double3 x, double3 y); | ||
| 1232 | double4 __ovld __cnfn copysign(double4 x, double4 y); | ||
| 1233 | double8 __ovld __cnfn copysign(double8 x, double8 y); | ||
| 1234 | double16 __ovld __cnfn copysign(double16 x, double16 y); | ||
| 1235 | -#endif //cl_khr_fp64 | ||
| 1236 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1237 | #ifdef cl_khr_fp16 | ||
| 1238 | half __ovld __cnfn copysign(half x, half y); | ||
| 1239 | half2 __ovld __cnfn copysign(half2 x, half2 y); | ||
| 1240 | @@ -6899,14 +6898,14 @@ float3 __ovld __cnfn cos(float3); | ||
| 1241 | float4 __ovld __cnfn cos(float4); | ||
| 1242 | float8 __ovld __cnfn cos(float8); | ||
| 1243 | float16 __ovld __cnfn cos(float16); | ||
| 1244 | -#ifdef cl_khr_fp64 | ||
| 1245 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1246 | double __ovld __cnfn cos(double); | ||
| 1247 | double2 __ovld __cnfn cos(double2); | ||
| 1248 | double3 __ovld __cnfn cos(double3); | ||
| 1249 | double4 __ovld __cnfn cos(double4); | ||
| 1250 | double8 __ovld __cnfn cos(double8); | ||
| 1251 | double16 __ovld __cnfn cos(double16); | ||
| 1252 | -#endif //cl_khr_fp64 | ||
| 1253 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1254 | #ifdef cl_khr_fp16 | ||
| 1255 | half __ovld __cnfn cos(half); | ||
| 1256 | half2 __ovld __cnfn cos(half2); | ||
| 1257 | @@ -6925,14 +6924,14 @@ float3 __ovld __cnfn cosh(float3); | ||
| 1258 | float4 __ovld __cnfn cosh(float4); | ||
| 1259 | float8 __ovld __cnfn cosh(float8); | ||
| 1260 | float16 __ovld __cnfn cosh(float16); | ||
| 1261 | -#ifdef cl_khr_fp64 | ||
| 1262 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1263 | double __ovld __cnfn cosh(double); | ||
| 1264 | double2 __ovld __cnfn cosh(double2); | ||
| 1265 | double3 __ovld __cnfn cosh(double3); | ||
| 1266 | double4 __ovld __cnfn cosh(double4); | ||
| 1267 | double8 __ovld __cnfn cosh(double8); | ||
| 1268 | double16 __ovld __cnfn cosh(double16); | ||
| 1269 | -#endif //cl_khr_fp64 | ||
| 1270 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1271 | #ifdef cl_khr_fp16 | ||
| 1272 | half __ovld __cnfn cosh(half); | ||
| 1273 | half2 __ovld __cnfn cosh(half2); | ||
| 1274 | @@ -6951,14 +6950,14 @@ float3 __ovld __cnfn cospi(float3 x); | ||
| 1275 | float4 __ovld __cnfn cospi(float4 x); | ||
| 1276 | float8 __ovld __cnfn cospi(float8 x); | ||
| 1277 | float16 __ovld __cnfn cospi(float16 x); | ||
| 1278 | -#ifdef cl_khr_fp64 | ||
| 1279 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1280 | double __ovld __cnfn cospi(double x); | ||
| 1281 | double2 __ovld __cnfn cospi(double2 x); | ||
| 1282 | double3 __ovld __cnfn cospi(double3 x); | ||
| 1283 | double4 __ovld __cnfn cospi(double4 x); | ||
| 1284 | double8 __ovld __cnfn cospi(double8 x); | ||
| 1285 | double16 __ovld __cnfn cospi(double16 x); | ||
| 1286 | -#endif //cl_khr_fp64 | ||
| 1287 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1288 | #ifdef cl_khr_fp16 | ||
| 1289 | half __ovld __cnfn cospi(half x); | ||
| 1290 | half2 __ovld __cnfn cospi(half2 x); | ||
| 1291 | @@ -6977,14 +6976,14 @@ float3 __ovld __cnfn erfc(float3); | ||
| 1292 | float4 __ovld __cnfn erfc(float4); | ||
| 1293 | float8 __ovld __cnfn erfc(float8); | ||
| 1294 | float16 __ovld __cnfn erfc(float16); | ||
| 1295 | -#ifdef cl_khr_fp64 | ||
| 1296 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1297 | double __ovld __cnfn erfc(double); | ||
| 1298 | double2 __ovld __cnfn erfc(double2); | ||
| 1299 | double3 __ovld __cnfn erfc(double3); | ||
| 1300 | double4 __ovld __cnfn erfc(double4); | ||
| 1301 | double8 __ovld __cnfn erfc(double8); | ||
| 1302 | double16 __ovld __cnfn erfc(double16); | ||
| 1303 | -#endif //cl_khr_fp64 | ||
| 1304 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1305 | #ifdef cl_khr_fp16 | ||
| 1306 | half __ovld __cnfn erfc(half); | ||
| 1307 | half2 __ovld __cnfn erfc(half2); | ||
| 1308 | @@ -7004,14 +7003,14 @@ float3 __ovld __cnfn erf(float3); | ||
| 1309 | float4 __ovld __cnfn erf(float4); | ||
| 1310 | float8 __ovld __cnfn erf(float8); | ||
| 1311 | float16 __ovld __cnfn erf(float16); | ||
| 1312 | -#ifdef cl_khr_fp64 | ||
| 1313 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1314 | double __ovld __cnfn erf(double); | ||
| 1315 | double2 __ovld __cnfn erf(double2); | ||
| 1316 | double3 __ovld __cnfn erf(double3); | ||
| 1317 | double4 __ovld __cnfn erf(double4); | ||
| 1318 | double8 __ovld __cnfn erf(double8); | ||
| 1319 | double16 __ovld __cnfn erf(double16); | ||
| 1320 | -#endif //cl_khr_fp64 | ||
| 1321 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1322 | #ifdef cl_khr_fp16 | ||
| 1323 | half __ovld __cnfn erf(half); | ||
| 1324 | half2 __ovld __cnfn erf(half2); | ||
| 1325 | @@ -7030,14 +7029,14 @@ float3 __ovld __cnfn exp(float3 x); | ||
| 1326 | float4 __ovld __cnfn exp(float4 x); | ||
| 1327 | float8 __ovld __cnfn exp(float8 x); | ||
| 1328 | float16 __ovld __cnfn exp(float16 x); | ||
| 1329 | -#ifdef cl_khr_fp64 | ||
| 1330 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1331 | double __ovld __cnfn exp(double x); | ||
| 1332 | double2 __ovld __cnfn exp(double2 x); | ||
| 1333 | double3 __ovld __cnfn exp(double3 x); | ||
| 1334 | double4 __ovld __cnfn exp(double4 x); | ||
| 1335 | double8 __ovld __cnfn exp(double8 x); | ||
| 1336 | double16 __ovld __cnfn exp(double16 x); | ||
| 1337 | -#endif //cl_khr_fp64 | ||
| 1338 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1339 | #ifdef cl_khr_fp16 | ||
| 1340 | half __ovld __cnfn exp(half x); | ||
| 1341 | half2 __ovld __cnfn exp(half2 x); | ||
| 1342 | @@ -7056,14 +7055,14 @@ float3 __ovld __cnfn exp2(float3); | ||
| 1343 | float4 __ovld __cnfn exp2(float4); | ||
| 1344 | float8 __ovld __cnfn exp2(float8); | ||
| 1345 | float16 __ovld __cnfn exp2(float16); | ||
| 1346 | -#ifdef cl_khr_fp64 | ||
| 1347 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1348 | double __ovld __cnfn exp2(double); | ||
| 1349 | double2 __ovld __cnfn exp2(double2); | ||
| 1350 | double3 __ovld __cnfn exp2(double3); | ||
| 1351 | double4 __ovld __cnfn exp2(double4); | ||
| 1352 | double8 __ovld __cnfn exp2(double8); | ||
| 1353 | double16 __ovld __cnfn exp2(double16); | ||
| 1354 | -#endif //cl_khr_fp64 | ||
| 1355 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1356 | #ifdef cl_khr_fp16 | ||
| 1357 | half __ovld __cnfn exp2(half); | ||
| 1358 | half2 __ovld __cnfn exp2(half2); | ||
| 1359 | @@ -7082,14 +7081,14 @@ float3 __ovld __cnfn exp10(float3); | ||
| 1360 | float4 __ovld __cnfn exp10(float4); | ||
| 1361 | float8 __ovld __cnfn exp10(float8); | ||
| 1362 | float16 __ovld __cnfn exp10(float16); | ||
| 1363 | -#ifdef cl_khr_fp64 | ||
| 1364 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1365 | double __ovld __cnfn exp10(double); | ||
| 1366 | double2 __ovld __cnfn exp10(double2); | ||
| 1367 | double3 __ovld __cnfn exp10(double3); | ||
| 1368 | double4 __ovld __cnfn exp10(double4); | ||
| 1369 | double8 __ovld __cnfn exp10(double8); | ||
| 1370 | double16 __ovld __cnfn exp10(double16); | ||
| 1371 | -#endif //cl_khr_fp64 | ||
| 1372 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1373 | #ifdef cl_khr_fp16 | ||
| 1374 | half __ovld __cnfn exp10(half); | ||
| 1375 | half2 __ovld __cnfn exp10(half2); | ||
| 1376 | @@ -7108,14 +7107,14 @@ float3 __ovld __cnfn expm1(float3 x); | ||
| 1377 | float4 __ovld __cnfn expm1(float4 x); | ||
| 1378 | float8 __ovld __cnfn expm1(float8 x); | ||
| 1379 | float16 __ovld __cnfn expm1(float16 x); | ||
| 1380 | -#ifdef cl_khr_fp64 | ||
| 1381 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1382 | double __ovld __cnfn expm1(double x); | ||
| 1383 | double2 __ovld __cnfn expm1(double2 x); | ||
| 1384 | double3 __ovld __cnfn expm1(double3 x); | ||
| 1385 | double4 __ovld __cnfn expm1(double4 x); | ||
| 1386 | double8 __ovld __cnfn expm1(double8 x); | ||
| 1387 | double16 __ovld __cnfn expm1(double16 x); | ||
| 1388 | -#endif //cl_khr_fp64 | ||
| 1389 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1390 | #ifdef cl_khr_fp16 | ||
| 1391 | half __ovld __cnfn expm1(half x); | ||
| 1392 | half2 __ovld __cnfn expm1(half2 x); | ||
| 1393 | @@ -7134,14 +7133,14 @@ float3 __ovld __cnfn fabs(float3); | ||
| 1394 | float4 __ovld __cnfn fabs(float4); | ||
| 1395 | float8 __ovld __cnfn fabs(float8); | ||
| 1396 | float16 __ovld __cnfn fabs(float16); | ||
| 1397 | -#ifdef cl_khr_fp64 | ||
| 1398 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1399 | double __ovld __cnfn fabs(double); | ||
| 1400 | double2 __ovld __cnfn fabs(double2); | ||
| 1401 | double3 __ovld __cnfn fabs(double3); | ||
| 1402 | double4 __ovld __cnfn fabs(double4); | ||
| 1403 | double8 __ovld __cnfn fabs(double8); | ||
| 1404 | double16 __ovld __cnfn fabs(double16); | ||
| 1405 | -#endif //cl_khr_fp64 | ||
| 1406 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1407 | #ifdef cl_khr_fp16 | ||
| 1408 | half __ovld __cnfn fabs(half); | ||
| 1409 | half2 __ovld __cnfn fabs(half2); | ||
| 1410 | @@ -7160,14 +7159,14 @@ float3 __ovld __cnfn fdim(float3 x, float3 y); | ||
| 1411 | float4 __ovld __cnfn fdim(float4 x, float4 y); | ||
| 1412 | float8 __ovld __cnfn fdim(float8 x, float8 y); | ||
| 1413 | float16 __ovld __cnfn fdim(float16 x, float16 y); | ||
| 1414 | -#ifdef cl_khr_fp64 | ||
| 1415 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1416 | double __ovld __cnfn fdim(double x, double y); | ||
| 1417 | double2 __ovld __cnfn fdim(double2 x, double2 y); | ||
| 1418 | double3 __ovld __cnfn fdim(double3 x, double3 y); | ||
| 1419 | double4 __ovld __cnfn fdim(double4 x, double4 y); | ||
| 1420 | double8 __ovld __cnfn fdim(double8 x, double8 y); | ||
| 1421 | double16 __ovld __cnfn fdim(double16 x, double16 y); | ||
| 1422 | -#endif //cl_khr_fp64 | ||
| 1423 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1424 | #ifdef cl_khr_fp16 | ||
| 1425 | half __ovld __cnfn fdim(half x, half y); | ||
| 1426 | half2 __ovld __cnfn fdim(half2 x, half2 y); | ||
| 1427 | @@ -7187,14 +7186,14 @@ float3 __ovld __cnfn floor(float3); | ||
| 1428 | float4 __ovld __cnfn floor(float4); | ||
| 1429 | float8 __ovld __cnfn floor(float8); | ||
| 1430 | float16 __ovld __cnfn floor(float16); | ||
| 1431 | -#ifdef cl_khr_fp64 | ||
| 1432 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1433 | double __ovld __cnfn floor(double); | ||
| 1434 | double2 __ovld __cnfn floor(double2); | ||
| 1435 | double3 __ovld __cnfn floor(double3); | ||
| 1436 | double4 __ovld __cnfn floor(double4); | ||
| 1437 | double8 __ovld __cnfn floor(double8); | ||
| 1438 | double16 __ovld __cnfn floor(double16); | ||
| 1439 | -#endif //cl_khr_fp64 | ||
| 1440 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1441 | #ifdef cl_khr_fp16 | ||
| 1442 | half __ovld __cnfn floor(half); | ||
| 1443 | half2 __ovld __cnfn floor(half2); | ||
| 1444 | @@ -7217,14 +7216,14 @@ float3 __ovld __cnfn fma(float3 a, float3 b, float3 c); | ||
| 1445 | float4 __ovld __cnfn fma(float4 a, float4 b, float4 c); | ||
| 1446 | float8 __ovld __cnfn fma(float8 a, float8 b, float8 c); | ||
| 1447 | float16 __ovld __cnfn fma(float16 a, float16 b, float16 c); | ||
| 1448 | -#ifdef cl_khr_fp64 | ||
| 1449 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1450 | double __ovld __cnfn fma(double a, double b, double c); | ||
| 1451 | double2 __ovld __cnfn fma(double2 a, double2 b, double2 c); | ||
| 1452 | double3 __ovld __cnfn fma(double3 a, double3 b, double3 c); | ||
| 1453 | double4 __ovld __cnfn fma(double4 a, double4 b, double4 c); | ||
| 1454 | double8 __ovld __cnfn fma(double8 a, double8 b, double8 c); | ||
| 1455 | double16 __ovld __cnfn fma(double16 a, double16 b, double16 c); | ||
| 1456 | -#endif //cl_khr_fp64 | ||
| 1457 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1458 | #ifdef cl_khr_fp16 | ||
| 1459 | half __ovld __cnfn fma(half a, half b, half c); | ||
| 1460 | half2 __ovld __cnfn fma(half2 a, half2 b, half2 c); | ||
| 1461 | @@ -7251,7 +7250,7 @@ float3 __ovld __cnfn fmax(float3 x, float y); | ||
| 1462 | float4 __ovld __cnfn fmax(float4 x, float y); | ||
| 1463 | float8 __ovld __cnfn fmax(float8 x, float y); | ||
| 1464 | float16 __ovld __cnfn fmax(float16 x, float y); | ||
| 1465 | -#ifdef cl_khr_fp64 | ||
| 1466 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1467 | double __ovld __cnfn fmax(double x, double y); | ||
| 1468 | double2 __ovld __cnfn fmax(double2 x, double2 y); | ||
| 1469 | double3 __ovld __cnfn fmax(double3 x, double3 y); | ||
| 1470 | @@ -7263,7 +7262,7 @@ double3 __ovld __cnfn fmax(double3 x, double y); | ||
| 1471 | double4 __ovld __cnfn fmax(double4 x, double y); | ||
| 1472 | double8 __ovld __cnfn fmax(double8 x, double y); | ||
| 1473 | double16 __ovld __cnfn fmax(double16 x, double y); | ||
| 1474 | -#endif //cl_khr_fp64 | ||
| 1475 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1476 | #ifdef cl_khr_fp16 | ||
| 1477 | half __ovld __cnfn fmax(half x, half y); | ||
| 1478 | half2 __ovld __cnfn fmax(half2 x, half2 y); | ||
| 1479 | @@ -7295,7 +7294,7 @@ float3 __ovld __cnfn fmin(float3 x, float y); | ||
| 1480 | float4 __ovld __cnfn fmin(float4 x, float y); | ||
| 1481 | float8 __ovld __cnfn fmin(float8 x, float y); | ||
| 1482 | float16 __ovld __cnfn fmin(float16 x, float y); | ||
| 1483 | -#ifdef cl_khr_fp64 | ||
| 1484 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1485 | double __ovld __cnfn fmin(double x, double y); | ||
| 1486 | double2 __ovld __cnfn fmin(double2 x, double2 y); | ||
| 1487 | double3 __ovld __cnfn fmin(double3 x, double3 y); | ||
| 1488 | @@ -7307,7 +7306,7 @@ double3 __ovld __cnfn fmin(double3 x, double y); | ||
| 1489 | double4 __ovld __cnfn fmin(double4 x, double y); | ||
| 1490 | double8 __ovld __cnfn fmin(double8 x, double y); | ||
| 1491 | double16 __ovld __cnfn fmin(double16 x, double y); | ||
| 1492 | -#endif //cl_khr_fp64 | ||
| 1493 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1494 | #ifdef cl_khr_fp16 | ||
| 1495 | half __ovld __cnfn fmin(half x, half y); | ||
| 1496 | half2 __ovld __cnfn fmin(half2 x, half2 y); | ||
| 1497 | @@ -7331,14 +7330,14 @@ float3 __ovld __cnfn fmod(float3 x, float3 y); | ||
| 1498 | float4 __ovld __cnfn fmod(float4 x, float4 y); | ||
| 1499 | float8 __ovld __cnfn fmod(float8 x, float8 y); | ||
| 1500 | float16 __ovld __cnfn fmod(float16 x, float16 y); | ||
| 1501 | -#ifdef cl_khr_fp64 | ||
| 1502 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1503 | double __ovld __cnfn fmod(double x, double y); | ||
| 1504 | double2 __ovld __cnfn fmod(double2 x, double2 y); | ||
| 1505 | double3 __ovld __cnfn fmod(double3 x, double3 y); | ||
| 1506 | double4 __ovld __cnfn fmod(double4 x, double4 y); | ||
| 1507 | double8 __ovld __cnfn fmod(double8 x, double8 y); | ||
| 1508 | double16 __ovld __cnfn fmod(double16 x, double16 y); | ||
| 1509 | -#endif //cl_khr_fp64 | ||
| 1510 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1511 | #ifdef cl_khr_fp16 | ||
| 1512 | half __ovld __cnfn fmod(half x, half y); | ||
| 1513 | half2 __ovld __cnfn fmod(half2 x, half2 y); | ||
| 1514 | @@ -7352,21 +7351,21 @@ half16 __ovld __cnfn fmod(half16 x, half16 y); | ||
| 1515 | * Returns fmin(x - floor (x), 0x1.fffffep-1f ). | ||
| 1516 | * floor(x) is returned in iptr. | ||
| 1517 | */ | ||
| 1518 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1519 | +#ifdef __opencl_c_generic_address_space | ||
| 1520 | float __ovld fract(float x, float *iptr); | ||
| 1521 | float2 __ovld fract(float2 x, float2 *iptr); | ||
| 1522 | float3 __ovld fract(float3 x, float3 *iptr); | ||
| 1523 | float4 __ovld fract(float4 x, float4 *iptr); | ||
| 1524 | float8 __ovld fract(float8 x, float8 *iptr); | ||
| 1525 | float16 __ovld fract(float16 x, float16 *iptr); | ||
| 1526 | -#ifdef cl_khr_fp64 | ||
| 1527 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1528 | double __ovld fract(double x, double *iptr); | ||
| 1529 | double2 __ovld fract(double2 x, double2 *iptr); | ||
| 1530 | double3 __ovld fract(double3 x, double3 *iptr); | ||
| 1531 | double4 __ovld fract(double4 x, double4 *iptr); | ||
| 1532 | double8 __ovld fract(double8 x, double8 *iptr); | ||
| 1533 | double16 __ovld fract(double16 x, double16 *iptr); | ||
| 1534 | -#endif //cl_khr_fp64 | ||
| 1535 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1536 | #ifdef cl_khr_fp16 | ||
| 1537 | half __ovld fract(half x, half *iptr); | ||
| 1538 | half2 __ovld fract(half2 x, half2 *iptr); | ||
| 1539 | @@ -7375,7 +7374,9 @@ half4 __ovld fract(half4 x, half4 *iptr); | ||
| 1540 | half8 __ovld fract(half8 x, half8 *iptr); | ||
| 1541 | half16 __ovld fract(half16 x, half16 *iptr); | ||
| 1542 | #endif //cl_khr_fp16 | ||
| 1543 | -#else | ||
| 1544 | +#endif //__opencl_c_generic_address_space | ||
| 1545 | + | ||
| 1546 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 1547 | float __ovld fract(float x, __global float *iptr); | ||
| 1548 | float2 __ovld fract(float2 x, __global float2 *iptr); | ||
| 1549 | float3 __ovld fract(float3 x, __global float3 *iptr); | ||
| 1550 | @@ -7394,7 +7395,7 @@ float3 __ovld fract(float3 x, __private float3 *iptr); | ||
| 1551 | float4 __ovld fract(float4 x, __private float4 *iptr); | ||
| 1552 | float8 __ovld fract(float8 x, __private float8 *iptr); | ||
| 1553 | float16 __ovld fract(float16 x, __private float16 *iptr); | ||
| 1554 | -#ifdef cl_khr_fp64 | ||
| 1555 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1556 | double __ovld fract(double x, __global double *iptr); | ||
| 1557 | double2 __ovld fract(double2 x, __global double2 *iptr); | ||
| 1558 | double3 __ovld fract(double3 x, __global double3 *iptr); | ||
| 1559 | @@ -7413,7 +7414,7 @@ double3 __ovld fract(double3 x, __private double3 *iptr); | ||
| 1560 | double4 __ovld fract(double4 x, __private double4 *iptr); | ||
| 1561 | double8 __ovld fract(double8 x, __private double8 *iptr); | ||
| 1562 | double16 __ovld fract(double16 x, __private double16 *iptr); | ||
| 1563 | -#endif //cl_khr_fp64 | ||
| 1564 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1565 | #ifdef cl_khr_fp16 | ||
| 1566 | half __ovld fract(half x, __global half *iptr); | ||
| 1567 | half2 __ovld fract(half2 x, __global half2 *iptr); | ||
| 1568 | @@ -7434,29 +7435,29 @@ half4 __ovld fract(half4 x, __private half4 *iptr); | ||
| 1569 | half8 __ovld fract(half8 x, __private half8 *iptr); | ||
| 1570 | half16 __ovld fract(half16 x, __private half16 *iptr); | ||
| 1571 | #endif //cl_khr_fp16 | ||
| 1572 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1573 | - | ||
| 1574 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 1575 | + //! CL_VERSION_2_0) | ||
| 1576 | /** | ||
| 1577 | * Extract mantissa and exponent from x. For each | ||
| 1578 | * component the mantissa returned is a float with | ||
| 1579 | * magnitude in the interval [1/2, 1) or 0. Each | ||
| 1580 | * component of x equals mantissa returned * 2^exp. | ||
| 1581 | */ | ||
| 1582 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1583 | +#ifdef __opencl_c_generic_address_space | ||
| 1584 | float __ovld frexp(float x, int *exp); | ||
| 1585 | float2 __ovld frexp(float2 x, int2 *exp); | ||
| 1586 | float3 __ovld frexp(float3 x, int3 *exp); | ||
| 1587 | float4 __ovld frexp(float4 x, int4 *exp); | ||
| 1588 | float8 __ovld frexp(float8 x, int8 *exp); | ||
| 1589 | float16 __ovld frexp(float16 x, int16 *exp); | ||
| 1590 | -#ifdef cl_khr_fp64 | ||
| 1591 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1592 | double __ovld frexp(double x, int *exp); | ||
| 1593 | double2 __ovld frexp(double2 x, int2 *exp); | ||
| 1594 | double3 __ovld frexp(double3 x, int3 *exp); | ||
| 1595 | double4 __ovld frexp(double4 x, int4 *exp); | ||
| 1596 | double8 __ovld frexp(double8 x, int8 *exp); | ||
| 1597 | double16 __ovld frexp(double16 x, int16 *exp); | ||
| 1598 | -#endif //cl_khr_fp64 | ||
| 1599 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1600 | #ifdef cl_khr_fp16 | ||
| 1601 | half __ovld frexp(half x, int *exp); | ||
| 1602 | half2 __ovld frexp(half2 x, int2 *exp); | ||
| 1603 | @@ -7465,7 +7466,9 @@ half4 __ovld frexp(half4 x, int4 *exp); | ||
| 1604 | half8 __ovld frexp(half8 x, int8 *exp); | ||
| 1605 | half16 __ovld frexp(half16 x, int16 *exp); | ||
| 1606 | #endif //cl_khr_fp16 | ||
| 1607 | -#else | ||
| 1608 | +#endif //__opencl_c_generic_address_space | ||
| 1609 | + | ||
| 1610 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 1611 | float __ovld frexp(float x, __global int *exp); | ||
| 1612 | float2 __ovld frexp(float2 x, __global int2 *exp); | ||
| 1613 | float3 __ovld frexp(float3 x, __global int3 *exp); | ||
| 1614 | @@ -7484,7 +7487,7 @@ float3 __ovld frexp(float3 x, __private int3 *exp); | ||
| 1615 | float4 __ovld frexp(float4 x, __private int4 *exp); | ||
| 1616 | float8 __ovld frexp(float8 x, __private int8 *exp); | ||
| 1617 | float16 __ovld frexp(float16 x, __private int16 *exp); | ||
| 1618 | -#ifdef cl_khr_fp64 | ||
| 1619 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1620 | double __ovld frexp(double x, __global int *exp); | ||
| 1621 | double2 __ovld frexp(double2 x, __global int2 *exp); | ||
| 1622 | double3 __ovld frexp(double3 x, __global int3 *exp); | ||
| 1623 | @@ -7503,7 +7506,7 @@ double3 __ovld frexp(double3 x, __private int3 *exp); | ||
| 1624 | double4 __ovld frexp(double4 x, __private int4 *exp); | ||
| 1625 | double8 __ovld frexp(double8 x, __private int8 *exp); | ||
| 1626 | double16 __ovld frexp(double16 x, __private int16 *exp); | ||
| 1627 | -#endif //cl_khr_fp64 | ||
| 1628 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1629 | #ifdef cl_khr_fp16 | ||
| 1630 | half __ovld frexp(half x, __global int *exp); | ||
| 1631 | half2 __ovld frexp(half2 x, __global int2 *exp); | ||
| 1632 | @@ -7524,7 +7527,8 @@ half4 __ovld frexp(half4 x, __private int4 *exp); | ||
| 1633 | half8 __ovld frexp(half8 x, __private int8 *exp); | ||
| 1634 | half16 __ovld frexp(half16 x, __private int16 *exp); | ||
| 1635 | #endif //cl_khr_fp16 | ||
| 1636 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1637 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 1638 | + //! CL_VERSION_2_0) | ||
| 1639 | |||
| 1640 | /** | ||
| 1641 | * Compute the value of the square root of x^2 + y^2 | ||
| 1642 | @@ -7536,14 +7540,14 @@ float3 __ovld __cnfn hypot(float3 x, float3 y); | ||
| 1643 | float4 __ovld __cnfn hypot(float4 x, float4 y); | ||
| 1644 | float8 __ovld __cnfn hypot(float8 x, float8 y); | ||
| 1645 | float16 __ovld __cnfn hypot(float16 x, float16 y); | ||
| 1646 | -#ifdef cl_khr_fp64 | ||
| 1647 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1648 | double __ovld __cnfn hypot(double x, double y); | ||
| 1649 | double2 __ovld __cnfn hypot(double2 x, double2 y); | ||
| 1650 | double3 __ovld __cnfn hypot(double3 x, double3 y); | ||
| 1651 | double4 __ovld __cnfn hypot(double4 x, double4 y); | ||
| 1652 | double8 __ovld __cnfn hypot(double8 x, double8 y); | ||
| 1653 | double16 __ovld __cnfn hypot(double16 x, double16 y); | ||
| 1654 | -#endif //cl_khr_fp64 | ||
| 1655 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1656 | #ifdef cl_khr_fp16 | ||
| 1657 | half __ovld __cnfn hypot(half x, half y); | ||
| 1658 | half2 __ovld __cnfn hypot(half2 x, half2 y); | ||
| 1659 | @@ -7562,14 +7566,14 @@ int3 __ovld __cnfn ilogb(float3 x); | ||
| 1660 | int4 __ovld __cnfn ilogb(float4 x); | ||
| 1661 | int8 __ovld __cnfn ilogb(float8 x); | ||
| 1662 | int16 __ovld __cnfn ilogb(float16 x); | ||
| 1663 | -#ifdef cl_khr_fp64 | ||
| 1664 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1665 | int __ovld __cnfn ilogb(double x); | ||
| 1666 | int2 __ovld __cnfn ilogb(double2 x); | ||
| 1667 | int3 __ovld __cnfn ilogb(double3 x); | ||
| 1668 | int4 __ovld __cnfn ilogb(double4 x); | ||
| 1669 | int8 __ovld __cnfn ilogb(double8 x); | ||
| 1670 | int16 __ovld __cnfn ilogb(double16 x); | ||
| 1671 | -#endif //cl_khr_fp64 | ||
| 1672 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1673 | #ifdef cl_khr_fp16 | ||
| 1674 | int __ovld __cnfn ilogb(half x); | ||
| 1675 | int2 __ovld __cnfn ilogb(half2 x); | ||
| 1676 | @@ -7593,7 +7597,7 @@ float3 __ovld __cnfn ldexp(float3 x, int n); | ||
| 1677 | float4 __ovld __cnfn ldexp(float4 x, int n); | ||
| 1678 | float8 __ovld __cnfn ldexp(float8 x, int n); | ||
| 1679 | float16 __ovld __cnfn ldexp(float16 x, int n); | ||
| 1680 | -#ifdef cl_khr_fp64 | ||
| 1681 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1682 | double __ovld __cnfn ldexp(double x, int n); | ||
| 1683 | double2 __ovld __cnfn ldexp(double2 x, int2 n); | ||
| 1684 | double3 __ovld __cnfn ldexp(double3 x, int3 n); | ||
| 1685 | @@ -7605,7 +7609,7 @@ double3 __ovld __cnfn ldexp(double3 x, int n); | ||
| 1686 | double4 __ovld __cnfn ldexp(double4 x, int n); | ||
| 1687 | double8 __ovld __cnfn ldexp(double8 x, int n); | ||
| 1688 | double16 __ovld __cnfn ldexp(double16 x, int n); | ||
| 1689 | -#endif //cl_khr_fp64 | ||
| 1690 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1691 | #ifdef cl_khr_fp16 | ||
| 1692 | half __ovld __cnfn ldexp(half x, int n); | ||
| 1693 | half2 __ovld __cnfn ldexp(half2 x, int2 n); | ||
| 1694 | @@ -7632,14 +7636,14 @@ float3 __ovld __cnfn lgamma(float3 x); | ||
| 1695 | float4 __ovld __cnfn lgamma(float4 x); | ||
| 1696 | float8 __ovld __cnfn lgamma(float8 x); | ||
| 1697 | float16 __ovld __cnfn lgamma(float16 x); | ||
| 1698 | -#ifdef cl_khr_fp64 | ||
| 1699 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1700 | double __ovld __cnfn lgamma(double x); | ||
| 1701 | double2 __ovld __cnfn lgamma(double2 x); | ||
| 1702 | double3 __ovld __cnfn lgamma(double3 x); | ||
| 1703 | double4 __ovld __cnfn lgamma(double4 x); | ||
| 1704 | double8 __ovld __cnfn lgamma(double8 x); | ||
| 1705 | double16 __ovld __cnfn lgamma(double16 x); | ||
| 1706 | -#endif //cl_khr_fp64 | ||
| 1707 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1708 | #ifdef cl_khr_fp16 | ||
| 1709 | half __ovld __cnfn lgamma(half x); | ||
| 1710 | half2 __ovld __cnfn lgamma(half2 x); | ||
| 1711 | @@ -7649,21 +7653,21 @@ half8 __ovld __cnfn lgamma(half8 x); | ||
| 1712 | half16 __ovld __cnfn lgamma(half16 x); | ||
| 1713 | #endif //cl_khr_fp16 | ||
| 1714 | |||
| 1715 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1716 | +#ifdef __opencl_c_generic_address_space | ||
| 1717 | float __ovld lgamma_r(float x, int *signp); | ||
| 1718 | float2 __ovld lgamma_r(float2 x, int2 *signp); | ||
| 1719 | float3 __ovld lgamma_r(float3 x, int3 *signp); | ||
| 1720 | float4 __ovld lgamma_r(float4 x, int4 *signp); | ||
| 1721 | float8 __ovld lgamma_r(float8 x, int8 *signp); | ||
| 1722 | float16 __ovld lgamma_r(float16 x, int16 *signp); | ||
| 1723 | -#ifdef cl_khr_fp64 | ||
| 1724 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1725 | double __ovld lgamma_r(double x, int *signp); | ||
| 1726 | double2 __ovld lgamma_r(double2 x, int2 *signp); | ||
| 1727 | double3 __ovld lgamma_r(double3 x, int3 *signp); | ||
| 1728 | double4 __ovld lgamma_r(double4 x, int4 *signp); | ||
| 1729 | double8 __ovld lgamma_r(double8 x, int8 *signp); | ||
| 1730 | double16 __ovld lgamma_r(double16 x, int16 *signp); | ||
| 1731 | -#endif //cl_khr_fp64 | ||
| 1732 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1733 | #ifdef cl_khr_fp16 | ||
| 1734 | half __ovld lgamma_r(half x, int *signp); | ||
| 1735 | half2 __ovld lgamma_r(half2 x, int2 *signp); | ||
| 1736 | @@ -7672,7 +7676,9 @@ half4 __ovld lgamma_r(half4 x, int4 *signp); | ||
| 1737 | half8 __ovld lgamma_r(half8 x, int8 *signp); | ||
| 1738 | half16 __ovld lgamma_r(half16 x, int16 *signp); | ||
| 1739 | #endif //cl_khr_fp16 | ||
| 1740 | -#else | ||
| 1741 | +#endif //__opencl_c_generic_address_space | ||
| 1742 | + | ||
| 1743 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 1744 | float __ovld lgamma_r(float x, __global int *signp); | ||
| 1745 | float2 __ovld lgamma_r(float2 x, __global int2 *signp); | ||
| 1746 | float3 __ovld lgamma_r(float3 x, __global int3 *signp); | ||
| 1747 | @@ -7691,7 +7697,7 @@ float3 __ovld lgamma_r(float3 x, __private int3 *signp); | ||
| 1748 | float4 __ovld lgamma_r(float4 x, __private int4 *signp); | ||
| 1749 | float8 __ovld lgamma_r(float8 x, __private int8 *signp); | ||
| 1750 | float16 __ovld lgamma_r(float16 x, __private int16 *signp); | ||
| 1751 | -#ifdef cl_khr_fp64 | ||
| 1752 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1753 | double __ovld lgamma_r(double x, __global int *signp); | ||
| 1754 | double2 __ovld lgamma_r(double2 x, __global int2 *signp); | ||
| 1755 | double3 __ovld lgamma_r(double3 x, __global int3 *signp); | ||
| 1756 | @@ -7710,7 +7716,7 @@ double3 __ovld lgamma_r(double3 x, __private int3 *signp); | ||
| 1757 | double4 __ovld lgamma_r(double4 x, __private int4 *signp); | ||
| 1758 | double8 __ovld lgamma_r(double8 x, __private int8 *signp); | ||
| 1759 | double16 __ovld lgamma_r(double16 x, __private int16 *signp); | ||
| 1760 | -#endif //cl_khr_fp64 | ||
| 1761 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1762 | #ifdef cl_khr_fp16 | ||
| 1763 | half __ovld lgamma_r(half x, __global int *signp); | ||
| 1764 | half2 __ovld lgamma_r(half2 x, __global int2 *signp); | ||
| 1765 | @@ -7731,8 +7737,8 @@ half4 __ovld lgamma_r(half4 x, __private int4 *signp); | ||
| 1766 | half8 __ovld lgamma_r(half8 x, __private int8 *signp); | ||
| 1767 | half16 __ovld lgamma_r(half16 x, __private int16 *signp); | ||
| 1768 | #endif //cl_khr_fp16 | ||
| 1769 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1770 | - | ||
| 1771 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 1772 | + //! CL_VERSION_2_0) | ||
| 1773 | /** | ||
| 1774 | * Compute natural logarithm. | ||
| 1775 | */ | ||
| 1776 | @@ -7742,14 +7748,14 @@ float3 __ovld __cnfn log(float3); | ||
| 1777 | float4 __ovld __cnfn log(float4); | ||
| 1778 | float8 __ovld __cnfn log(float8); | ||
| 1779 | float16 __ovld __cnfn log(float16); | ||
| 1780 | -#ifdef cl_khr_fp64 | ||
| 1781 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1782 | double __ovld __cnfn log(double); | ||
| 1783 | double2 __ovld __cnfn log(double2); | ||
| 1784 | double3 __ovld __cnfn log(double3); | ||
| 1785 | double4 __ovld __cnfn log(double4); | ||
| 1786 | double8 __ovld __cnfn log(double8); | ||
| 1787 | double16 __ovld __cnfn log(double16); | ||
| 1788 | -#endif //cl_khr_fp64 | ||
| 1789 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1790 | #ifdef cl_khr_fp16 | ||
| 1791 | half __ovld __cnfn log(half); | ||
| 1792 | half2 __ovld __cnfn log(half2); | ||
| 1793 | @@ -7760,7 +7766,7 @@ half16 __ovld __cnfn log(half16); | ||
| 1794 | #endif //cl_khr_fp16 | ||
| 1795 | |||
| 1796 | /** | ||
| 1797 | - * Compute a base 2 logarithm. | ||
| 1798 | + * Compute a base 2 logarithm | ||
| 1799 | */ | ||
| 1800 | float __ovld __cnfn log2(float); | ||
| 1801 | float2 __ovld __cnfn log2(float2); | ||
| 1802 | @@ -7768,14 +7774,14 @@ float3 __ovld __cnfn log2(float3); | ||
| 1803 | float4 __ovld __cnfn log2(float4); | ||
| 1804 | float8 __ovld __cnfn log2(float8); | ||
| 1805 | float16 __ovld __cnfn log2(float16); | ||
| 1806 | -#ifdef cl_khr_fp64 | ||
| 1807 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1808 | double __ovld __cnfn log2(double); | ||
| 1809 | double2 __ovld __cnfn log2(double2); | ||
| 1810 | double3 __ovld __cnfn log2(double3); | ||
| 1811 | double4 __ovld __cnfn log2(double4); | ||
| 1812 | double8 __ovld __cnfn log2(double8); | ||
| 1813 | double16 __ovld __cnfn log2(double16); | ||
| 1814 | -#endif //cl_khr_fp64 | ||
| 1815 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1816 | #ifdef cl_khr_fp16 | ||
| 1817 | half __ovld __cnfn log2(half); | ||
| 1818 | half2 __ovld __cnfn log2(half2); | ||
| 1819 | @@ -7794,14 +7800,14 @@ float3 __ovld __cnfn log10(float3); | ||
| 1820 | float4 __ovld __cnfn log10(float4); | ||
| 1821 | float8 __ovld __cnfn log10(float8); | ||
| 1822 | float16 __ovld __cnfn log10(float16); | ||
| 1823 | -#ifdef cl_khr_fp64 | ||
| 1824 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1825 | double __ovld __cnfn log10(double); | ||
| 1826 | double2 __ovld __cnfn log10(double2); | ||
| 1827 | double3 __ovld __cnfn log10(double3); | ||
| 1828 | double4 __ovld __cnfn log10(double4); | ||
| 1829 | double8 __ovld __cnfn log10(double8); | ||
| 1830 | double16 __ovld __cnfn log10(double16); | ||
| 1831 | -#endif //cl_khr_fp64 | ||
| 1832 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1833 | #ifdef cl_khr_fp16 | ||
| 1834 | half __ovld __cnfn log10(half); | ||
| 1835 | half2 __ovld __cnfn log10(half2); | ||
| 1836 | @@ -7820,14 +7826,14 @@ float3 __ovld __cnfn log1p(float3 x); | ||
| 1837 | float4 __ovld __cnfn log1p(float4 x); | ||
| 1838 | float8 __ovld __cnfn log1p(float8 x); | ||
| 1839 | float16 __ovld __cnfn log1p(float16 x); | ||
| 1840 | -#ifdef cl_khr_fp64 | ||
| 1841 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1842 | double __ovld __cnfn log1p(double x); | ||
| 1843 | double2 __ovld __cnfn log1p(double2 x); | ||
| 1844 | double3 __ovld __cnfn log1p(double3 x); | ||
| 1845 | double4 __ovld __cnfn log1p(double4 x); | ||
| 1846 | double8 __ovld __cnfn log1p(double8 x); | ||
| 1847 | double16 __ovld __cnfn log1p(double16 x); | ||
| 1848 | -#endif //cl_khr_fp64 | ||
| 1849 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1850 | #ifdef cl_khr_fp16 | ||
| 1851 | half __ovld __cnfn log1p(half x); | ||
| 1852 | half2 __ovld __cnfn log1p(half2 x); | ||
| 1853 | @@ -7847,14 +7853,14 @@ float3 __ovld __cnfn logb(float3 x); | ||
| 1854 | float4 __ovld __cnfn logb(float4 x); | ||
| 1855 | float8 __ovld __cnfn logb(float8 x); | ||
| 1856 | float16 __ovld __cnfn logb(float16 x); | ||
| 1857 | -#ifdef cl_khr_fp64 | ||
| 1858 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1859 | double __ovld __cnfn logb(double x); | ||
| 1860 | double2 __ovld __cnfn logb(double2 x); | ||
| 1861 | double3 __ovld __cnfn logb(double3 x); | ||
| 1862 | double4 __ovld __cnfn logb(double4 x); | ||
| 1863 | double8 __ovld __cnfn logb(double8 x); | ||
| 1864 | double16 __ovld __cnfn logb(double16 x); | ||
| 1865 | -#endif //cl_khr_fp64 | ||
| 1866 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1867 | #ifdef cl_khr_fp16 | ||
| 1868 | half __ovld __cnfn logb(half x); | ||
| 1869 | half2 __ovld __cnfn logb(half2 x); | ||
| 1870 | @@ -7877,14 +7883,14 @@ float3 __ovld __cnfn mad(float3 a, float3 b, float3 c); | ||
| 1871 | float4 __ovld __cnfn mad(float4 a, float4 b, float4 c); | ||
| 1872 | float8 __ovld __cnfn mad(float8 a, float8 b, float8 c); | ||
| 1873 | float16 __ovld __cnfn mad(float16 a, float16 b, float16 c); | ||
| 1874 | -#ifdef cl_khr_fp64 | ||
| 1875 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1876 | double __ovld __cnfn mad(double a, double b, double c); | ||
| 1877 | double2 __ovld __cnfn mad(double2 a, double2 b, double2 c); | ||
| 1878 | double3 __ovld __cnfn mad(double3 a, double3 b, double3 c); | ||
| 1879 | double4 __ovld __cnfn mad(double4 a, double4 b, double4 c); | ||
| 1880 | double8 __ovld __cnfn mad(double8 a, double8 b, double8 c); | ||
| 1881 | double16 __ovld __cnfn mad(double16 a, double16 b, double16 c); | ||
| 1882 | -#endif //cl_khr_fp64 | ||
| 1883 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1884 | #ifdef cl_khr_fp16 | ||
| 1885 | half __ovld __cnfn mad(half a, half b, half c); | ||
| 1886 | half2 __ovld __cnfn mad(half2 a, half2 b, half2 c); | ||
| 1887 | @@ -7904,14 +7910,14 @@ float3 __ovld __cnfn maxmag(float3 x, float3 y); | ||
| 1888 | float4 __ovld __cnfn maxmag(float4 x, float4 y); | ||
| 1889 | float8 __ovld __cnfn maxmag(float8 x, float8 y); | ||
| 1890 | float16 __ovld __cnfn maxmag(float16 x, float16 y); | ||
| 1891 | -#ifdef cl_khr_fp64 | ||
| 1892 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1893 | double __ovld __cnfn maxmag(double x, double y); | ||
| 1894 | double2 __ovld __cnfn maxmag(double2 x, double2 y); | ||
| 1895 | double3 __ovld __cnfn maxmag(double3 x, double3 y); | ||
| 1896 | double4 __ovld __cnfn maxmag(double4 x, double4 y); | ||
| 1897 | double8 __ovld __cnfn maxmag(double8 x, double8 y); | ||
| 1898 | double16 __ovld __cnfn maxmag(double16 x, double16 y); | ||
| 1899 | -#endif //cl_khr_fp64 | ||
| 1900 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1901 | #ifdef cl_khr_fp16 | ||
| 1902 | half __ovld __cnfn maxmag(half x, half y); | ||
| 1903 | half2 __ovld __cnfn maxmag(half2 x, half2 y); | ||
| 1904 | @@ -7931,14 +7937,14 @@ float3 __ovld __cnfn minmag(float3 x, float3 y); | ||
| 1905 | float4 __ovld __cnfn minmag(float4 x, float4 y); | ||
| 1906 | float8 __ovld __cnfn minmag(float8 x, float8 y); | ||
| 1907 | float16 __ovld __cnfn minmag(float16 x, float16 y); | ||
| 1908 | -#ifdef cl_khr_fp64 | ||
| 1909 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1910 | double __ovld __cnfn minmag(double x, double y); | ||
| 1911 | double2 __ovld __cnfn minmag(double2 x, double2 y); | ||
| 1912 | double3 __ovld __cnfn minmag(double3 x, double3 y); | ||
| 1913 | double4 __ovld __cnfn minmag(double4 x, double4 y); | ||
| 1914 | double8 __ovld __cnfn minmag(double8 x, double8 y); | ||
| 1915 | double16 __ovld __cnfn minmag(double16 x, double16 y); | ||
| 1916 | -#endif //cl_khr_fp64 | ||
| 1917 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1918 | #ifdef cl_khr_fp16 | ||
| 1919 | half __ovld __cnfn minmag(half x, half y); | ||
| 1920 | half2 __ovld __cnfn minmag(half2 x, half2 y); | ||
| 1921 | @@ -7955,21 +7961,21 @@ half16 __ovld __cnfn minmag(half16 x, half16 y); | ||
| 1922 | * the argument. It stores the integral part in the object | ||
| 1923 | * pointed to by iptr. | ||
| 1924 | */ | ||
| 1925 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1926 | +#ifdef __opencl_c_generic_address_space | ||
| 1927 | float __ovld modf(float x, float *iptr); | ||
| 1928 | float2 __ovld modf(float2 x, float2 *iptr); | ||
| 1929 | float3 __ovld modf(float3 x, float3 *iptr); | ||
| 1930 | float4 __ovld modf(float4 x, float4 *iptr); | ||
| 1931 | float8 __ovld modf(float8 x, float8 *iptr); | ||
| 1932 | float16 __ovld modf(float16 x, float16 *iptr); | ||
| 1933 | -#ifdef cl_khr_fp64 | ||
| 1934 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1935 | double __ovld modf(double x, double *iptr); | ||
| 1936 | double2 __ovld modf(double2 x, double2 *iptr); | ||
| 1937 | double3 __ovld modf(double3 x, double3 *iptr); | ||
| 1938 | double4 __ovld modf(double4 x, double4 *iptr); | ||
| 1939 | double8 __ovld modf(double8 x, double8 *iptr); | ||
| 1940 | double16 __ovld modf(double16 x, double16 *iptr); | ||
| 1941 | -#endif //cl_khr_fp64 | ||
| 1942 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1943 | #ifdef cl_khr_fp16 | ||
| 1944 | half __ovld modf(half x, half *iptr); | ||
| 1945 | half2 __ovld modf(half2 x, half2 *iptr); | ||
| 1946 | @@ -7978,7 +7984,9 @@ half4 __ovld modf(half4 x, half4 *iptr); | ||
| 1947 | half8 __ovld modf(half8 x, half8 *iptr); | ||
| 1948 | half16 __ovld modf(half16 x, half16 *iptr); | ||
| 1949 | #endif //cl_khr_fp16 | ||
| 1950 | -#else | ||
| 1951 | +#endif //__opencl_c_generic_address_space | ||
| 1952 | + | ||
| 1953 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 1954 | float __ovld modf(float x, __global float *iptr); | ||
| 1955 | float2 __ovld modf(float2 x, __global float2 *iptr); | ||
| 1956 | float3 __ovld modf(float3 x, __global float3 *iptr); | ||
| 1957 | @@ -7997,7 +8005,7 @@ float3 __ovld modf(float3 x, __private float3 *iptr); | ||
| 1958 | float4 __ovld modf(float4 x, __private float4 *iptr); | ||
| 1959 | float8 __ovld modf(float8 x, __private float8 *iptr); | ||
| 1960 | float16 __ovld modf(float16 x, __private float16 *iptr); | ||
| 1961 | -#ifdef cl_khr_fp64 | ||
| 1962 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1963 | double __ovld modf(double x, __global double *iptr); | ||
| 1964 | double2 __ovld modf(double2 x, __global double2 *iptr); | ||
| 1965 | double3 __ovld modf(double3 x, __global double3 *iptr); | ||
| 1966 | @@ -8016,7 +8024,7 @@ double3 __ovld modf(double3 x, __private double3 *iptr); | ||
| 1967 | double4 __ovld modf(double4 x, __private double4 *iptr); | ||
| 1968 | double8 __ovld modf(double8 x, __private double8 *iptr); | ||
| 1969 | double16 __ovld modf(double16 x, __private double16 *iptr); | ||
| 1970 | -#endif //cl_khr_fp64 | ||
| 1971 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1972 | #ifdef cl_khr_fp16 | ||
| 1973 | half __ovld modf(half x, __global half *iptr); | ||
| 1974 | half2 __ovld modf(half2 x, __global half2 *iptr); | ||
| 1975 | @@ -8037,7 +8045,8 @@ half4 __ovld modf(half4 x, __private half4 *iptr); | ||
| 1976 | half8 __ovld modf(half8 x, __private half8 *iptr); | ||
| 1977 | half16 __ovld modf(half16 x, __private half16 *iptr); | ||
| 1978 | #endif //cl_khr_fp16 | ||
| 1979 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 1980 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 1981 | + //! CL_VERSION_2_0) | ||
| 1982 | |||
| 1983 | /** | ||
| 1984 | * Returns a quiet NaN. The nancode may be placed | ||
| 1985 | @@ -8049,14 +8058,14 @@ float3 __ovld __cnfn nan(uint3 nancode); | ||
| 1986 | float4 __ovld __cnfn nan(uint4 nancode); | ||
| 1987 | float8 __ovld __cnfn nan(uint8 nancode); | ||
| 1988 | float16 __ovld __cnfn nan(uint16 nancode); | ||
| 1989 | -#ifdef cl_khr_fp64 | ||
| 1990 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1991 | double __ovld __cnfn nan(ulong nancode); | ||
| 1992 | double2 __ovld __cnfn nan(ulong2 nancode); | ||
| 1993 | double3 __ovld __cnfn nan(ulong3 nancode); | ||
| 1994 | double4 __ovld __cnfn nan(ulong4 nancode); | ||
| 1995 | double8 __ovld __cnfn nan(ulong8 nancode); | ||
| 1996 | double16 __ovld __cnfn nan(ulong16 nancode); | ||
| 1997 | -#endif //cl_khr_fp64 | ||
| 1998 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 1999 | #ifdef cl_khr_fp16 | ||
| 2000 | half __ovld __cnfn nan(ushort nancode); | ||
| 2001 | half2 __ovld __cnfn nan(ushort2 nancode); | ||
| 2002 | @@ -8079,14 +8088,14 @@ float3 __ovld __cnfn nextafter(float3 x, float3 y); | ||
| 2003 | float4 __ovld __cnfn nextafter(float4 x, float4 y); | ||
| 2004 | float8 __ovld __cnfn nextafter(float8 x, float8 y); | ||
| 2005 | float16 __ovld __cnfn nextafter(float16 x, float16 y); | ||
| 2006 | -#ifdef cl_khr_fp64 | ||
| 2007 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2008 | double __ovld __cnfn nextafter(double x, double y); | ||
| 2009 | double2 __ovld __cnfn nextafter(double2 x, double2 y); | ||
| 2010 | double3 __ovld __cnfn nextafter(double3 x, double3 y); | ||
| 2011 | double4 __ovld __cnfn nextafter(double4 x, double4 y); | ||
| 2012 | double8 __ovld __cnfn nextafter(double8 x, double8 y); | ||
| 2013 | double16 __ovld __cnfn nextafter(double16 x, double16 y); | ||
| 2014 | -#endif //cl_khr_fp64 | ||
| 2015 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2016 | #ifdef cl_khr_fp16 | ||
| 2017 | half __ovld __cnfn nextafter(half x, half y); | ||
| 2018 | half2 __ovld __cnfn nextafter(half2 x, half2 y); | ||
| 2019 | @@ -8105,14 +8114,14 @@ float3 __ovld __cnfn pow(float3 x, float3 y); | ||
| 2020 | float4 __ovld __cnfn pow(float4 x, float4 y); | ||
| 2021 | float8 __ovld __cnfn pow(float8 x, float8 y); | ||
| 2022 | float16 __ovld __cnfn pow(float16 x, float16 y); | ||
| 2023 | -#ifdef cl_khr_fp64 | ||
| 2024 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2025 | double __ovld __cnfn pow(double x, double y); | ||
| 2026 | double2 __ovld __cnfn pow(double2 x, double2 y); | ||
| 2027 | double3 __ovld __cnfn pow(double3 x, double3 y); | ||
| 2028 | double4 __ovld __cnfn pow(double4 x, double4 y); | ||
| 2029 | double8 __ovld __cnfn pow(double8 x, double8 y); | ||
| 2030 | double16 __ovld __cnfn pow(double16 x, double16 y); | ||
| 2031 | -#endif //cl_khr_fp64 | ||
| 2032 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2033 | #ifdef cl_khr_fp16 | ||
| 2034 | half __ovld __cnfn pow(half x, half y); | ||
| 2035 | half2 __ovld __cnfn pow(half2 x, half2 y); | ||
| 2036 | @@ -8131,14 +8140,14 @@ float3 __ovld __cnfn pown(float3 x, int3 y); | ||
| 2037 | float4 __ovld __cnfn pown(float4 x, int4 y); | ||
| 2038 | float8 __ovld __cnfn pown(float8 x, int8 y); | ||
| 2039 | float16 __ovld __cnfn pown(float16 x, int16 y); | ||
| 2040 | -#ifdef cl_khr_fp64 | ||
| 2041 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2042 | double __ovld __cnfn pown(double x, int y); | ||
| 2043 | double2 __ovld __cnfn pown(double2 x, int2 y); | ||
| 2044 | double3 __ovld __cnfn pown(double3 x, int3 y); | ||
| 2045 | double4 __ovld __cnfn pown(double4 x, int4 y); | ||
| 2046 | double8 __ovld __cnfn pown(double8 x, int8 y); | ||
| 2047 | double16 __ovld __cnfn pown(double16 x, int16 y); | ||
| 2048 | -#endif //cl_khr_fp64 | ||
| 2049 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2050 | #ifdef cl_khr_fp16 | ||
| 2051 | half __ovld __cnfn pown(half x, int y); | ||
| 2052 | half2 __ovld __cnfn pown(half2 x, int2 y); | ||
| 2053 | @@ -8157,14 +8166,14 @@ float3 __ovld __cnfn powr(float3 x, float3 y); | ||
| 2054 | float4 __ovld __cnfn powr(float4 x, float4 y); | ||
| 2055 | float8 __ovld __cnfn powr(float8 x, float8 y); | ||
| 2056 | float16 __ovld __cnfn powr(float16 x, float16 y); | ||
| 2057 | -#ifdef cl_khr_fp64 | ||
| 2058 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2059 | double __ovld __cnfn powr(double x, double y); | ||
| 2060 | double2 __ovld __cnfn powr(double2 x, double2 y); | ||
| 2061 | double3 __ovld __cnfn powr(double3 x, double3 y); | ||
| 2062 | double4 __ovld __cnfn powr(double4 x, double4 y); | ||
| 2063 | double8 __ovld __cnfn powr(double8 x, double8 y); | ||
| 2064 | double16 __ovld __cnfn powr(double16 x, double16 y); | ||
| 2065 | -#endif //cl_khr_fp64 | ||
| 2066 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2067 | #ifdef cl_khr_fp16 | ||
| 2068 | half __ovld __cnfn powr(half x, half y); | ||
| 2069 | half2 __ovld __cnfn powr(half2 x, half2 y); | ||
| 2070 | @@ -8186,14 +8195,14 @@ float3 __ovld __cnfn remainder(float3 x, float3 y); | ||
| 2071 | float4 __ovld __cnfn remainder(float4 x, float4 y); | ||
| 2072 | float8 __ovld __cnfn remainder(float8 x, float8 y); | ||
| 2073 | float16 __ovld __cnfn remainder(float16 x, float16 y); | ||
| 2074 | -#ifdef cl_khr_fp64 | ||
| 2075 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2076 | double __ovld __cnfn remainder(double x, double y); | ||
| 2077 | double2 __ovld __cnfn remainder(double2 x, double2 y); | ||
| 2078 | double3 __ovld __cnfn remainder(double3 x, double3 y); | ||
| 2079 | double4 __ovld __cnfn remainder(double4 x, double4 y); | ||
| 2080 | double8 __ovld __cnfn remainder(double8 x, double8 y); | ||
| 2081 | double16 __ovld __cnfn remainder(double16 x, double16 y); | ||
| 2082 | -#endif //cl_khr_fp64 | ||
| 2083 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2084 | #ifdef cl_khr_fp16 | ||
| 2085 | half __ovld __cnfn remainder(half x, half y); | ||
| 2086 | half2 __ovld __cnfn remainder(half2 x, half2 y); | ||
| 2087 | @@ -8215,21 +8224,21 @@ half16 __ovld __cnfn remainder(half16 x, half16 y); | ||
| 2088 | * sign as x/y. It stores this signed value in the object | ||
| 2089 | * pointed to by quo. | ||
| 2090 | */ | ||
| 2091 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2092 | +#ifdef __opencl_c_generic_address_space | ||
| 2093 | float __ovld remquo(float x, float y, int *quo); | ||
| 2094 | float2 __ovld remquo(float2 x, float2 y, int2 *quo); | ||
| 2095 | float3 __ovld remquo(float3 x, float3 y, int3 *quo); | ||
| 2096 | float4 __ovld remquo(float4 x, float4 y, int4 *quo); | ||
| 2097 | float8 __ovld remquo(float8 x, float8 y, int8 *quo); | ||
| 2098 | float16 __ovld remquo(float16 x, float16 y, int16 *quo); | ||
| 2099 | -#ifdef cl_khr_fp64 | ||
| 2100 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2101 | double __ovld remquo(double x, double y, int *quo); | ||
| 2102 | double2 __ovld remquo(double2 x, double2 y, int2 *quo); | ||
| 2103 | double3 __ovld remquo(double3 x, double3 y, int3 *quo); | ||
| 2104 | double4 __ovld remquo(double4 x, double4 y, int4 *quo); | ||
| 2105 | double8 __ovld remquo(double8 x, double8 y, int8 *quo); | ||
| 2106 | double16 __ovld remquo(double16 x, double16 y, int16 *quo); | ||
| 2107 | -#endif //cl_khr_fp64 | ||
| 2108 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2109 | #ifdef cl_khr_fp16 | ||
| 2110 | half __ovld remquo(half x, half y, int *quo); | ||
| 2111 | half2 __ovld remquo(half2 x, half2 y, int2 *quo); | ||
| 2112 | @@ -8237,9 +8246,10 @@ half3 __ovld remquo(half3 x, half3 y, int3 *quo); | ||
| 2113 | half4 __ovld remquo(half4 x, half4 y, int4 *quo); | ||
| 2114 | half8 __ovld remquo(half8 x, half8 y, int8 *quo); | ||
| 2115 | half16 __ovld remquo(half16 x, half16 y, int16 *quo); | ||
| 2116 | - | ||
| 2117 | #endif //cl_khr_fp16 | ||
| 2118 | -#else | ||
| 2119 | +#endif //__opencl_c_generic_address_space | ||
| 2120 | + | ||
| 2121 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 2122 | float __ovld remquo(float x, float y, __global int *quo); | ||
| 2123 | float2 __ovld remquo(float2 x, float2 y, __global int2 *quo); | ||
| 2124 | float3 __ovld remquo(float3 x, float3 y, __global int3 *quo); | ||
| 2125 | @@ -8258,7 +8268,7 @@ float3 __ovld remquo(float3 x, float3 y, __private int3 *quo); | ||
| 2126 | float4 __ovld remquo(float4 x, float4 y, __private int4 *quo); | ||
| 2127 | float8 __ovld remquo(float8 x, float8 y, __private int8 *quo); | ||
| 2128 | float16 __ovld remquo(float16 x, float16 y, __private int16 *quo); | ||
| 2129 | -#ifdef cl_khr_fp64 | ||
| 2130 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2131 | double __ovld remquo(double x, double y, __global int *quo); | ||
| 2132 | double2 __ovld remquo(double2 x, double2 y, __global int2 *quo); | ||
| 2133 | double3 __ovld remquo(double3 x, double3 y, __global int3 *quo); | ||
| 2134 | @@ -8277,7 +8287,7 @@ double3 __ovld remquo(double3 x, double3 y, __private int3 *quo); | ||
| 2135 | double4 __ovld remquo(double4 x, double4 y, __private int4 *quo); | ||
| 2136 | double8 __ovld remquo(double8 x, double8 y, __private int8 *quo); | ||
| 2137 | double16 __ovld remquo(double16 x, double16 y, __private int16 *quo); | ||
| 2138 | -#endif //cl_khr_fp64 | ||
| 2139 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2140 | #ifdef cl_khr_fp16 | ||
| 2141 | half __ovld remquo(half x, half y, __global int *quo); | ||
| 2142 | half2 __ovld remquo(half2 x, half2 y, __global int2 *quo); | ||
| 2143 | @@ -8298,7 +8308,8 @@ half4 __ovld remquo(half4 x, half4 y, __private int4 *quo); | ||
| 2144 | half8 __ovld remquo(half8 x, half8 y, __private int8 *quo); | ||
| 2145 | half16 __ovld remquo(half16 x, half16 y, __private int16 *quo); | ||
| 2146 | #endif //cl_khr_fp16 | ||
| 2147 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2148 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 2149 | + //! CL_VERSION_2_0) | ||
| 2150 | /** | ||
| 2151 | * Round to integral value (using round to nearest | ||
| 2152 | * even rounding mode) in floating-point format. | ||
| 2153 | @@ -8311,14 +8322,14 @@ float3 __ovld __cnfn rint(float3); | ||
| 2154 | float4 __ovld __cnfn rint(float4); | ||
| 2155 | float8 __ovld __cnfn rint(float8); | ||
| 2156 | float16 __ovld __cnfn rint(float16); | ||
| 2157 | -#ifdef cl_khr_fp64 | ||
| 2158 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2159 | double __ovld __cnfn rint(double); | ||
| 2160 | double2 __ovld __cnfn rint(double2); | ||
| 2161 | double3 __ovld __cnfn rint(double3); | ||
| 2162 | double4 __ovld __cnfn rint(double4); | ||
| 2163 | double8 __ovld __cnfn rint(double8); | ||
| 2164 | double16 __ovld __cnfn rint(double16); | ||
| 2165 | -#endif //cl_khr_fp64 | ||
| 2166 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2167 | #ifdef cl_khr_fp16 | ||
| 2168 | half __ovld __cnfn rint(half); | ||
| 2169 | half2 __ovld __cnfn rint(half2); | ||
| 2170 | @@ -8337,14 +8348,14 @@ float3 __ovld __cnfn rootn(float3 x, int3 y); | ||
| 2171 | float4 __ovld __cnfn rootn(float4 x, int4 y); | ||
| 2172 | float8 __ovld __cnfn rootn(float8 x, int8 y); | ||
| 2173 | float16 __ovld __cnfn rootn(float16 x, int16 y); | ||
| 2174 | -#ifdef cl_khr_fp64 | ||
| 2175 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2176 | double __ovld __cnfn rootn(double x, int y); | ||
| 2177 | double2 __ovld __cnfn rootn(double2 x, int2 y); | ||
| 2178 | double3 __ovld __cnfn rootn(double3 x, int3 y); | ||
| 2179 | double4 __ovld __cnfn rootn(double4 x, int4 y); | ||
| 2180 | double8 __ovld __cnfn rootn(double8 x, int8 y); | ||
| 2181 | double16 __ovld __cnfn rootn(double16 x, int16 y); | ||
| 2182 | -#endif //cl_khr_fp64 | ||
| 2183 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2184 | #ifdef cl_khr_fp16 | ||
| 2185 | half __ovld __cnfn rootn(half x, int y); | ||
| 2186 | half2 __ovld __cnfn rootn(half2 x, int2 y); | ||
| 2187 | @@ -8365,14 +8376,14 @@ float3 __ovld __cnfn round(float3 x); | ||
| 2188 | float4 __ovld __cnfn round(float4 x); | ||
| 2189 | float8 __ovld __cnfn round(float8 x); | ||
| 2190 | float16 __ovld __cnfn round(float16 x); | ||
| 2191 | -#ifdef cl_khr_fp64 | ||
| 2192 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2193 | double __ovld __cnfn round(double x); | ||
| 2194 | double2 __ovld __cnfn round(double2 x); | ||
| 2195 | double3 __ovld __cnfn round(double3 x); | ||
| 2196 | double4 __ovld __cnfn round(double4 x); | ||
| 2197 | double8 __ovld __cnfn round(double8 x); | ||
| 2198 | double16 __ovld __cnfn round(double16 x); | ||
| 2199 | -#endif //cl_khr_fp64 | ||
| 2200 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2201 | #ifdef cl_khr_fp16 | ||
| 2202 | half __ovld __cnfn round(half x); | ||
| 2203 | half2 __ovld __cnfn round(half2 x); | ||
| 2204 | @@ -8391,14 +8402,14 @@ float3 __ovld __cnfn rsqrt(float3); | ||
| 2205 | float4 __ovld __cnfn rsqrt(float4); | ||
| 2206 | float8 __ovld __cnfn rsqrt(float8); | ||
| 2207 | float16 __ovld __cnfn rsqrt(float16); | ||
| 2208 | -#ifdef cl_khr_fp64 | ||
| 2209 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2210 | double __ovld __cnfn rsqrt(double); | ||
| 2211 | double2 __ovld __cnfn rsqrt(double2); | ||
| 2212 | double3 __ovld __cnfn rsqrt(double3); | ||
| 2213 | double4 __ovld __cnfn rsqrt(double4); | ||
| 2214 | double8 __ovld __cnfn rsqrt(double8); | ||
| 2215 | double16 __ovld __cnfn rsqrt(double16); | ||
| 2216 | -#endif //cl_khr_fp64 | ||
| 2217 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2218 | #ifdef cl_khr_fp16 | ||
| 2219 | half __ovld __cnfn rsqrt(half); | ||
| 2220 | half2 __ovld __cnfn rsqrt(half2); | ||
| 2221 | @@ -8417,14 +8428,14 @@ float3 __ovld __cnfn sin(float3); | ||
| 2222 | float4 __ovld __cnfn sin(float4); | ||
| 2223 | float8 __ovld __cnfn sin(float8); | ||
| 2224 | float16 __ovld __cnfn sin(float16); | ||
| 2225 | -#ifdef cl_khr_fp64 | ||
| 2226 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2227 | double __ovld __cnfn sin(double); | ||
| 2228 | double2 __ovld __cnfn sin(double2); | ||
| 2229 | double3 __ovld __cnfn sin(double3); | ||
| 2230 | double4 __ovld __cnfn sin(double4); | ||
| 2231 | double8 __ovld __cnfn sin(double8); | ||
| 2232 | double16 __ovld __cnfn sin(double16); | ||
| 2233 | -#endif //cl_khr_fp64 | ||
| 2234 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2235 | #ifdef cl_khr_fp16 | ||
| 2236 | half __ovld __cnfn sin(half); | ||
| 2237 | half2 __ovld __cnfn sin(half2); | ||
| 2238 | @@ -8439,21 +8450,21 @@ half16 __ovld __cnfn sin(half16); | ||
| 2239 | * is the return value and computed cosine is returned | ||
| 2240 | * in cosval. | ||
| 2241 | */ | ||
| 2242 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2243 | +#ifdef __opencl_c_generic_address_space | ||
| 2244 | float __ovld sincos(float x, float *cosval); | ||
| 2245 | float2 __ovld sincos(float2 x, float2 *cosval); | ||
| 2246 | float3 __ovld sincos(float3 x, float3 *cosval); | ||
| 2247 | float4 __ovld sincos(float4 x, float4 *cosval); | ||
| 2248 | float8 __ovld sincos(float8 x, float8 *cosval); | ||
| 2249 | float16 __ovld sincos(float16 x, float16 *cosval); | ||
| 2250 | -#ifdef cl_khr_fp64 | ||
| 2251 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2252 | double __ovld sincos(double x, double *cosval); | ||
| 2253 | double2 __ovld sincos(double2 x, double2 *cosval); | ||
| 2254 | double3 __ovld sincos(double3 x, double3 *cosval); | ||
| 2255 | double4 __ovld sincos(double4 x, double4 *cosval); | ||
| 2256 | double8 __ovld sincos(double8 x, double8 *cosval); | ||
| 2257 | double16 __ovld sincos(double16 x, double16 *cosval); | ||
| 2258 | -#endif //cl_khr_fp64 | ||
| 2259 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2260 | #ifdef cl_khr_fp16 | ||
| 2261 | half __ovld sincos(half x, half *cosval); | ||
| 2262 | half2 __ovld sincos(half2 x, half2 *cosval); | ||
| 2263 | @@ -8462,7 +8473,9 @@ half4 __ovld sincos(half4 x, half4 *cosval); | ||
| 2264 | half8 __ovld sincos(half8 x, half8 *cosval); | ||
| 2265 | half16 __ovld sincos(half16 x, half16 *cosval); | ||
| 2266 | #endif //cl_khr_fp16 | ||
| 2267 | -#else | ||
| 2268 | +#endif //__opencl_c_generic_address_space | ||
| 2269 | + | ||
| 2270 | +#if !defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != CL_VERSION_2_0) | ||
| 2271 | float __ovld sincos(float x, __global float *cosval); | ||
| 2272 | float2 __ovld sincos(float2 x, __global float2 *cosval); | ||
| 2273 | float3 __ovld sincos(float3 x, __global float3 *cosval); | ||
| 2274 | @@ -8481,7 +8494,7 @@ float3 __ovld sincos(float3 x, __private float3 *cosval); | ||
| 2275 | float4 __ovld sincos(float4 x, __private float4 *cosval); | ||
| 2276 | float8 __ovld sincos(float8 x, __private float8 *cosval); | ||
| 2277 | float16 __ovld sincos(float16 x, __private float16 *cosval); | ||
| 2278 | -#ifdef cl_khr_fp64 | ||
| 2279 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2280 | double __ovld sincos(double x, __global double *cosval); | ||
| 2281 | double2 __ovld sincos(double2 x, __global double2 *cosval); | ||
| 2282 | double3 __ovld sincos(double3 x, __global double3 *cosval); | ||
| 2283 | @@ -8500,7 +8513,7 @@ double3 __ovld sincos(double3 x, __private double3 *cosval); | ||
| 2284 | double4 __ovld sincos(double4 x, __private double4 *cosval); | ||
| 2285 | double8 __ovld sincos(double8 x, __private double8 *cosval); | ||
| 2286 | double16 __ovld sincos(double16 x, __private double16 *cosval); | ||
| 2287 | -#endif //cl_khr_fp64 | ||
| 2288 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2289 | #ifdef cl_khr_fp16 | ||
| 2290 | half __ovld sincos(half x, __global half *cosval); | ||
| 2291 | half2 __ovld sincos(half2 x, __global half2 *cosval); | ||
| 2292 | @@ -8521,8 +8534,8 @@ half4 __ovld sincos(half4 x, __private half4 *cosval); | ||
| 2293 | half8 __ovld sincos(half8 x, __private half8 *cosval); | ||
| 2294 | half16 __ovld sincos(half16 x, __private half16 *cosval); | ||
| 2295 | #endif //cl_khr_fp16 | ||
| 2296 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2297 | - | ||
| 2298 | +#endif //! defined(__OPENCL_CPP_VERSION__) && (__OPENCL_C_VERSION__ != | ||
| 2299 | + //! CL_VERSION_2_0) | ||
| 2300 | /** | ||
| 2301 | * Compute hyperbolic sine. | ||
| 2302 | */ | ||
| 2303 | @@ -8532,14 +8545,14 @@ float3 __ovld __cnfn sinh(float3); | ||
| 2304 | float4 __ovld __cnfn sinh(float4); | ||
| 2305 | float8 __ovld __cnfn sinh(float8); | ||
| 2306 | float16 __ovld __cnfn sinh(float16); | ||
| 2307 | -#ifdef cl_khr_fp64 | ||
| 2308 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2309 | double __ovld __cnfn sinh(double); | ||
| 2310 | double2 __ovld __cnfn sinh(double2); | ||
| 2311 | double3 __ovld __cnfn sinh(double3); | ||
| 2312 | double4 __ovld __cnfn sinh(double4); | ||
| 2313 | double8 __ovld __cnfn sinh(double8); | ||
| 2314 | double16 __ovld __cnfn sinh(double16); | ||
| 2315 | -#endif //cl_khr_fp64 | ||
| 2316 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2317 | #ifdef cl_khr_fp16 | ||
| 2318 | half __ovld __cnfn sinh(half); | ||
| 2319 | half2 __ovld __cnfn sinh(half2); | ||
| 2320 | @@ -8558,14 +8571,14 @@ float3 __ovld __cnfn sinpi(float3 x); | ||
| 2321 | float4 __ovld __cnfn sinpi(float4 x); | ||
| 2322 | float8 __ovld __cnfn sinpi(float8 x); | ||
| 2323 | float16 __ovld __cnfn sinpi(float16 x); | ||
| 2324 | -#ifdef cl_khr_fp64 | ||
| 2325 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2326 | double __ovld __cnfn sinpi(double x); | ||
| 2327 | double2 __ovld __cnfn sinpi(double2 x); | ||
| 2328 | double3 __ovld __cnfn sinpi(double3 x); | ||
| 2329 | double4 __ovld __cnfn sinpi(double4 x); | ||
| 2330 | double8 __ovld __cnfn sinpi(double8 x); | ||
| 2331 | double16 __ovld __cnfn sinpi(double16 x); | ||
| 2332 | -#endif //cl_khr_fp64 | ||
| 2333 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2334 | #ifdef cl_khr_fp16 | ||
| 2335 | half __ovld __cnfn sinpi(half x); | ||
| 2336 | half2 __ovld __cnfn sinpi(half2 x); | ||
| 2337 | @@ -8584,14 +8597,14 @@ float3 __ovld __cnfn sqrt(float3); | ||
| 2338 | float4 __ovld __cnfn sqrt(float4); | ||
| 2339 | float8 __ovld __cnfn sqrt(float8); | ||
| 2340 | float16 __ovld __cnfn sqrt(float16); | ||
| 2341 | -#ifdef cl_khr_fp64 | ||
| 2342 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2343 | double __ovld __cnfn sqrt(double); | ||
| 2344 | double2 __ovld __cnfn sqrt(double2); | ||
| 2345 | double3 __ovld __cnfn sqrt(double3); | ||
| 2346 | double4 __ovld __cnfn sqrt(double4); | ||
| 2347 | double8 __ovld __cnfn sqrt(double8); | ||
| 2348 | double16 __ovld __cnfn sqrt(double16); | ||
| 2349 | -#endif //cl_khr_fp64 | ||
| 2350 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2351 | #ifdef cl_khr_fp16 | ||
| 2352 | half __ovld __cnfn sqrt(half); | ||
| 2353 | half2 __ovld __cnfn sqrt(half2); | ||
| 2354 | @@ -8610,14 +8623,14 @@ float3 __ovld __cnfn tan(float3); | ||
| 2355 | float4 __ovld __cnfn tan(float4); | ||
| 2356 | float8 __ovld __cnfn tan(float8); | ||
| 2357 | float16 __ovld __cnfn tan(float16); | ||
| 2358 | -#ifdef cl_khr_fp64 | ||
| 2359 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2360 | double __ovld __cnfn tan(double); | ||
| 2361 | double2 __ovld __cnfn tan(double2); | ||
| 2362 | double3 __ovld __cnfn tan(double3); | ||
| 2363 | double4 __ovld __cnfn tan(double4); | ||
| 2364 | double8 __ovld __cnfn tan(double8); | ||
| 2365 | double16 __ovld __cnfn tan(double16); | ||
| 2366 | -#endif //cl_khr_fp64 | ||
| 2367 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2368 | #ifdef cl_khr_fp16 | ||
| 2369 | half __ovld __cnfn tan(half); | ||
| 2370 | half2 __ovld __cnfn tan(half2); | ||
| 2371 | @@ -8636,14 +8649,14 @@ float3 __ovld __cnfn tanh(float3); | ||
| 2372 | float4 __ovld __cnfn tanh(float4); | ||
| 2373 | float8 __ovld __cnfn tanh(float8); | ||
| 2374 | float16 __ovld __cnfn tanh(float16); | ||
| 2375 | -#ifdef cl_khr_fp64 | ||
| 2376 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2377 | double __ovld __cnfn tanh(double); | ||
| 2378 | double2 __ovld __cnfn tanh(double2); | ||
| 2379 | double3 __ovld __cnfn tanh(double3); | ||
| 2380 | double4 __ovld __cnfn tanh(double4); | ||
| 2381 | double8 __ovld __cnfn tanh(double8); | ||
| 2382 | double16 __ovld __cnfn tanh(double16); | ||
| 2383 | -#endif //cl_khr_fp64 | ||
| 2384 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2385 | #ifdef cl_khr_fp16 | ||
| 2386 | half __ovld __cnfn tanh(half); | ||
| 2387 | half2 __ovld __cnfn tanh(half2); | ||
| 2388 | @@ -8662,14 +8675,14 @@ float3 __ovld __cnfn tanpi(float3 x); | ||
| 2389 | float4 __ovld __cnfn tanpi(float4 x); | ||
| 2390 | float8 __ovld __cnfn tanpi(float8 x); | ||
| 2391 | float16 __ovld __cnfn tanpi(float16 x); | ||
| 2392 | -#ifdef cl_khr_fp64 | ||
| 2393 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2394 | double __ovld __cnfn tanpi(double x); | ||
| 2395 | double2 __ovld __cnfn tanpi(double2 x); | ||
| 2396 | double3 __ovld __cnfn tanpi(double3 x); | ||
| 2397 | double4 __ovld __cnfn tanpi(double4 x); | ||
| 2398 | double8 __ovld __cnfn tanpi(double8 x); | ||
| 2399 | double16 __ovld __cnfn tanpi(double16 x); | ||
| 2400 | -#endif //cl_khr_fp64 | ||
| 2401 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2402 | #ifdef cl_khr_fp16 | ||
| 2403 | half __ovld __cnfn tanpi(half x); | ||
| 2404 | half2 __ovld __cnfn tanpi(half2 x); | ||
| 2405 | @@ -8688,14 +8701,14 @@ float3 __ovld __cnfn tgamma(float3); | ||
| 2406 | float4 __ovld __cnfn tgamma(float4); | ||
| 2407 | float8 __ovld __cnfn tgamma(float8); | ||
| 2408 | float16 __ovld __cnfn tgamma(float16); | ||
| 2409 | -#ifdef cl_khr_fp64 | ||
| 2410 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2411 | double __ovld __cnfn tgamma(double); | ||
| 2412 | double2 __ovld __cnfn tgamma(double2); | ||
| 2413 | double3 __ovld __cnfn tgamma(double3); | ||
| 2414 | double4 __ovld __cnfn tgamma(double4); | ||
| 2415 | double8 __ovld __cnfn tgamma(double8); | ||
| 2416 | double16 __ovld __cnfn tgamma(double16); | ||
| 2417 | -#endif //cl_khr_fp64 | ||
| 2418 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2419 | #ifdef cl_khr_fp16 | ||
| 2420 | half __ovld __cnfn tgamma(half); | ||
| 2421 | half2 __ovld __cnfn tgamma(half2); | ||
| 2422 | @@ -8715,14 +8728,14 @@ float3 __ovld __cnfn trunc(float3); | ||
| 2423 | float4 __ovld __cnfn trunc(float4); | ||
| 2424 | float8 __ovld __cnfn trunc(float8); | ||
| 2425 | float16 __ovld __cnfn trunc(float16); | ||
| 2426 | -#ifdef cl_khr_fp64 | ||
| 2427 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2428 | double __ovld __cnfn trunc(double); | ||
| 2429 | double2 __ovld __cnfn trunc(double2); | ||
| 2430 | double3 __ovld __cnfn trunc(double3); | ||
| 2431 | double4 __ovld __cnfn trunc(double4); | ||
| 2432 | double8 __ovld __cnfn trunc(double8); | ||
| 2433 | double16 __ovld __cnfn trunc(double16); | ||
| 2434 | -#endif //cl_khr_fp64 | ||
| 2435 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2436 | #ifdef cl_khr_fp16 | ||
| 2437 | half __ovld __cnfn trunc(half); | ||
| 2438 | half2 __ovld __cnfn trunc(half2); | ||
| 2439 | @@ -10108,7 +10121,7 @@ float3 __ovld __cnfn clamp(float3 x, float minval, float maxval); | ||
| 2440 | float4 __ovld __cnfn clamp(float4 x, float minval, float maxval); | ||
| 2441 | float8 __ovld __cnfn clamp(float8 x, float minval, float maxval); | ||
| 2442 | float16 __ovld __cnfn clamp(float16 x, float minval, float maxval); | ||
| 2443 | -#ifdef cl_khr_fp64 | ||
| 2444 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2445 | double __ovld __cnfn clamp(double x, double minval, double maxval); | ||
| 2446 | double2 __ovld __cnfn clamp(double2 x, double2 minval, double2 maxval); | ||
| 2447 | double3 __ovld __cnfn clamp(double3 x, double3 minval, double3 maxval); | ||
| 2448 | @@ -10120,7 +10133,7 @@ double3 __ovld __cnfn clamp(double3 x, double minval, double maxval); | ||
| 2449 | double4 __ovld __cnfn clamp(double4 x, double minval, double maxval); | ||
| 2450 | double8 __ovld __cnfn clamp(double8 x, double minval, double maxval); | ||
| 2451 | double16 __ovld __cnfn clamp(double16 x, double minval, double maxval); | ||
| 2452 | -#endif //cl_khr_fp64 | ||
| 2453 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2454 | #ifdef cl_khr_fp16 | ||
| 2455 | half __ovld __cnfn clamp(half x, half minval, half maxval); | ||
| 2456 | half2 __ovld __cnfn clamp(half2 x, half2 minval, half2 maxval); | ||
| 2457 | @@ -10145,14 +10158,14 @@ float3 __ovld __cnfn degrees(float3 radians); | ||
| 2458 | float4 __ovld __cnfn degrees(float4 radians); | ||
| 2459 | float8 __ovld __cnfn degrees(float8 radians); | ||
| 2460 | float16 __ovld __cnfn degrees(float16 radians); | ||
| 2461 | -#ifdef cl_khr_fp64 | ||
| 2462 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2463 | double __ovld __cnfn degrees(double radians); | ||
| 2464 | double2 __ovld __cnfn degrees(double2 radians); | ||
| 2465 | double3 __ovld __cnfn degrees(double3 radians); | ||
| 2466 | double4 __ovld __cnfn degrees(double4 radians); | ||
| 2467 | double8 __ovld __cnfn degrees(double8 radians); | ||
| 2468 | double16 __ovld __cnfn degrees(double16 radians); | ||
| 2469 | -#endif //cl_khr_fp64 | ||
| 2470 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2471 | #ifdef cl_khr_fp16 | ||
| 2472 | half __ovld __cnfn degrees(half radians); | ||
| 2473 | half2 __ovld __cnfn degrees(half2 radians); | ||
| 2474 | @@ -10177,7 +10190,7 @@ float3 __ovld __cnfn max(float3 x, float y); | ||
| 2475 | float4 __ovld __cnfn max(float4 x, float y); | ||
| 2476 | float8 __ovld __cnfn max(float8 x, float y); | ||
| 2477 | float16 __ovld __cnfn max(float16 x, float y); | ||
| 2478 | -#ifdef cl_khr_fp64 | ||
| 2479 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2480 | double __ovld __cnfn max(double x, double y); | ||
| 2481 | double2 __ovld __cnfn max(double2 x, double2 y); | ||
| 2482 | double3 __ovld __cnfn max(double3 x, double3 y); | ||
| 2483 | @@ -10189,7 +10202,7 @@ double3 __ovld __cnfn max(double3 x, double y); | ||
| 2484 | double4 __ovld __cnfn max(double4 x, double y); | ||
| 2485 | double8 __ovld __cnfn max(double8 x, double y); | ||
| 2486 | double16 __ovld __cnfn max(double16 x, double y); | ||
| 2487 | -#endif //cl_khr_fp64 | ||
| 2488 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2489 | #ifdef cl_khr_fp16 | ||
| 2490 | half __ovld __cnfn max(half x, half y); | ||
| 2491 | half2 __ovld __cnfn max(half2 x, half2 y); | ||
| 2492 | @@ -10219,7 +10232,7 @@ float3 __ovld __cnfn min(float3 x, float y); | ||
| 2493 | float4 __ovld __cnfn min(float4 x, float y); | ||
| 2494 | float8 __ovld __cnfn min(float8 x, float y); | ||
| 2495 | float16 __ovld __cnfn min(float16 x, float y); | ||
| 2496 | -#ifdef cl_khr_fp64 | ||
| 2497 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2498 | double __ovld __cnfn min(double x, double y); | ||
| 2499 | double2 __ovld __cnfn min(double2 x, double2 y); | ||
| 2500 | double3 __ovld __cnfn min(double3 x, double3 y); | ||
| 2501 | @@ -10231,7 +10244,7 @@ double3 __ovld __cnfn min(double3 x, double y); | ||
| 2502 | double4 __ovld __cnfn min(double4 x, double y); | ||
| 2503 | double8 __ovld __cnfn min(double8 x, double y); | ||
| 2504 | double16 __ovld __cnfn min(double16 x, double y); | ||
| 2505 | -#endif //cl_khr_fp64 | ||
| 2506 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2507 | #ifdef cl_khr_fp16 | ||
| 2508 | half __ovld __cnfn min(half x, half y); | ||
| 2509 | half2 __ovld __cnfn min(half2 x, half2 y); | ||
| 2510 | @@ -10264,7 +10277,7 @@ float3 __ovld __cnfn mix(float3 x, float3 y, float a); | ||
| 2511 | float4 __ovld __cnfn mix(float4 x, float4 y, float a); | ||
| 2512 | float8 __ovld __cnfn mix(float8 x, float8 y, float a); | ||
| 2513 | float16 __ovld __cnfn mix(float16 x, float16 y, float a); | ||
| 2514 | -#ifdef cl_khr_fp64 | ||
| 2515 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2516 | double __ovld __cnfn mix(double x, double y, double a); | ||
| 2517 | double2 __ovld __cnfn mix(double2 x, double2 y, double2 a); | ||
| 2518 | double3 __ovld __cnfn mix(double3 x, double3 y, double3 a); | ||
| 2519 | @@ -10276,7 +10289,7 @@ double3 __ovld __cnfn mix(double3 x, double3 y, double a); | ||
| 2520 | double4 __ovld __cnfn mix(double4 x, double4 y, double a); | ||
| 2521 | double8 __ovld __cnfn mix(double8 x, double8 y, double a); | ||
| 2522 | double16 __ovld __cnfn mix(double16 x, double16 y, double a); | ||
| 2523 | -#endif //cl_khr_fp64 | ||
| 2524 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2525 | #ifdef cl_khr_fp16 | ||
| 2526 | half __ovld __cnfn mix(half x, half y, half a); | ||
| 2527 | half2 __ovld __cnfn mix(half2 x, half2 y, half2 a); | ||
| 2528 | @@ -10301,14 +10314,14 @@ float3 __ovld __cnfn radians(float3 degrees); | ||
| 2529 | float4 __ovld __cnfn radians(float4 degrees); | ||
| 2530 | float8 __ovld __cnfn radians(float8 degrees); | ||
| 2531 | float16 __ovld __cnfn radians(float16 degrees); | ||
| 2532 | -#ifdef cl_khr_fp64 | ||
| 2533 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2534 | double __ovld __cnfn radians(double degrees); | ||
| 2535 | double2 __ovld __cnfn radians(double2 degrees); | ||
| 2536 | double3 __ovld __cnfn radians(double3 degrees); | ||
| 2537 | double4 __ovld __cnfn radians(double4 degrees); | ||
| 2538 | double8 __ovld __cnfn radians(double8 degrees); | ||
| 2539 | double16 __ovld __cnfn radians(double16 degrees); | ||
| 2540 | -#endif //cl_khr_fp64 | ||
| 2541 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2542 | #ifdef cl_khr_fp16 | ||
| 2543 | half __ovld __cnfn radians(half degrees); | ||
| 2544 | half2 __ovld __cnfn radians(half2 degrees); | ||
| 2545 | @@ -10332,7 +10345,7 @@ float3 __ovld __cnfn step(float edge, float3 x); | ||
| 2546 | float4 __ovld __cnfn step(float edge, float4 x); | ||
| 2547 | float8 __ovld __cnfn step(float edge, float8 x); | ||
| 2548 | float16 __ovld __cnfn step(float edge, float16 x); | ||
| 2549 | -#ifdef cl_khr_fp64 | ||
| 2550 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2551 | double __ovld __cnfn step(double edge, double x); | ||
| 2552 | double2 __ovld __cnfn step(double2 edge, double2 x); | ||
| 2553 | double3 __ovld __cnfn step(double3 edge, double3 x); | ||
| 2554 | @@ -10344,7 +10357,7 @@ double3 __ovld __cnfn step(double edge, double3 x); | ||
| 2555 | double4 __ovld __cnfn step(double edge, double4 x); | ||
| 2556 | double8 __ovld __cnfn step(double edge, double8 x); | ||
| 2557 | double16 __ovld __cnfn step(double edge, double16 x); | ||
| 2558 | -#endif //cl_khr_fp64 | ||
| 2559 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2560 | #ifdef cl_khr_fp16 | ||
| 2561 | half __ovld __cnfn step(half edge, half x); | ||
| 2562 | half2 __ovld __cnfn step(half2 edge, half2 x); | ||
| 2563 | @@ -10383,7 +10396,7 @@ float3 __ovld __cnfn smoothstep(float edge0, float edge1, float3 x); | ||
| 2564 | float4 __ovld __cnfn smoothstep(float edge0, float edge1, float4 x); | ||
| 2565 | float8 __ovld __cnfn smoothstep(float edge0, float edge1, float8 x); | ||
| 2566 | float16 __ovld __cnfn smoothstep(float edge0, float edge1, float16 x); | ||
| 2567 | -#ifdef cl_khr_fp64 | ||
| 2568 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2569 | double __ovld __cnfn smoothstep(double edge0, double edge1, double x); | ||
| 2570 | double2 __ovld __cnfn smoothstep(double2 edge0, double2 edge1, double2 x); | ||
| 2571 | double3 __ovld __cnfn smoothstep(double3 edge0, double3 edge1, double3 x); | ||
| 2572 | @@ -10395,7 +10408,7 @@ double3 __ovld __cnfn smoothstep(double edge0, double edge1, double3 x); | ||
| 2573 | double4 __ovld __cnfn smoothstep(double edge0, double edge1, double4 x); | ||
| 2574 | double8 __ovld __cnfn smoothstep(double edge0, double edge1, double8 x); | ||
| 2575 | double16 __ovld __cnfn smoothstep(double edge0, double edge1, double16 x); | ||
| 2576 | -#endif //cl_khr_fp64 | ||
| 2577 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2578 | #ifdef cl_khr_fp16 | ||
| 2579 | half __ovld __cnfn smoothstep(half edge0, half edge1, half x); | ||
| 2580 | half2 __ovld __cnfn smoothstep(half2 edge0, half2 edge1, half2 x); | ||
| 2581 | @@ -10420,14 +10433,14 @@ float3 __ovld __cnfn sign(float3 x); | ||
| 2582 | float4 __ovld __cnfn sign(float4 x); | ||
| 2583 | float8 __ovld __cnfn sign(float8 x); | ||
| 2584 | float16 __ovld __cnfn sign(float16 x); | ||
| 2585 | -#ifdef cl_khr_fp64 | ||
| 2586 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2587 | double __ovld __cnfn sign(double x); | ||
| 2588 | double2 __ovld __cnfn sign(double2 x); | ||
| 2589 | double3 __ovld __cnfn sign(double3 x); | ||
| 2590 | double4 __ovld __cnfn sign(double4 x); | ||
| 2591 | double8 __ovld __cnfn sign(double8 x); | ||
| 2592 | double16 __ovld __cnfn sign(double16 x); | ||
| 2593 | -#endif //cl_khr_fp64 | ||
| 2594 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2595 | #ifdef cl_khr_fp16 | ||
| 2596 | half __ovld __cnfn sign(half x); | ||
| 2597 | half2 __ovld __cnfn sign(half2 x); | ||
| 2598 | @@ -10445,10 +10458,10 @@ half16 __ovld __cnfn sign(half16 x); | ||
| 2599 | */ | ||
| 2600 | float4 __ovld __cnfn cross(float4 p0, float4 p1); | ||
| 2601 | float3 __ovld __cnfn cross(float3 p0, float3 p1); | ||
| 2602 | -#ifdef cl_khr_fp64 | ||
| 2603 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2604 | double4 __ovld __cnfn cross(double4 p0, double4 p1); | ||
| 2605 | double3 __ovld __cnfn cross(double3 p0, double3 p1); | ||
| 2606 | -#endif //cl_khr_fp64 | ||
| 2607 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2608 | #ifdef cl_khr_fp16 | ||
| 2609 | half4 __ovld __cnfn cross(half4 p0, half4 p1); | ||
| 2610 | half3 __ovld __cnfn cross(half3 p0, half3 p1); | ||
| 2611 | @@ -10461,12 +10474,12 @@ float __ovld __cnfn dot(float p0, float p1); | ||
| 2612 | float __ovld __cnfn dot(float2 p0, float2 p1); | ||
| 2613 | float __ovld __cnfn dot(float3 p0, float3 p1); | ||
| 2614 | float __ovld __cnfn dot(float4 p0, float4 p1); | ||
| 2615 | -#ifdef cl_khr_fp64 | ||
| 2616 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2617 | double __ovld __cnfn dot(double p0, double p1); | ||
| 2618 | double __ovld __cnfn dot(double2 p0, double2 p1); | ||
| 2619 | double __ovld __cnfn dot(double3 p0, double3 p1); | ||
| 2620 | double __ovld __cnfn dot(double4 p0, double4 p1); | ||
| 2621 | -#endif //cl_khr_fp64 | ||
| 2622 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2623 | #ifdef cl_khr_fp16 | ||
| 2624 | half __ovld __cnfn dot(half p0, half p1); | ||
| 2625 | half __ovld __cnfn dot(half2 p0, half2 p1); | ||
| 2626 | @@ -10482,12 +10495,12 @@ float __ovld __cnfn distance(float p0, float p1); | ||
| 2627 | float __ovld __cnfn distance(float2 p0, float2 p1); | ||
| 2628 | float __ovld __cnfn distance(float3 p0, float3 p1); | ||
| 2629 | float __ovld __cnfn distance(float4 p0, float4 p1); | ||
| 2630 | -#ifdef cl_khr_fp64 | ||
| 2631 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2632 | double __ovld __cnfn distance(double p0, double p1); | ||
| 2633 | double __ovld __cnfn distance(double2 p0, double2 p1); | ||
| 2634 | double __ovld __cnfn distance(double3 p0, double3 p1); | ||
| 2635 | double __ovld __cnfn distance(double4 p0, double4 p1); | ||
| 2636 | -#endif //cl_khr_fp64 | ||
| 2637 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2638 | #ifdef cl_khr_fp16 | ||
| 2639 | half __ovld __cnfn distance(half p0, half p1); | ||
| 2640 | half __ovld __cnfn distance(half2 p0, half2 p1); | ||
| 2641 | @@ -10503,12 +10516,12 @@ float __ovld __cnfn length(float p); | ||
| 2642 | float __ovld __cnfn length(float2 p); | ||
| 2643 | float __ovld __cnfn length(float3 p); | ||
| 2644 | float __ovld __cnfn length(float4 p); | ||
| 2645 | -#ifdef cl_khr_fp64 | ||
| 2646 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2647 | double __ovld __cnfn length(double p); | ||
| 2648 | double __ovld __cnfn length(double2 p); | ||
| 2649 | double __ovld __cnfn length(double3 p); | ||
| 2650 | double __ovld __cnfn length(double4 p); | ||
| 2651 | -#endif //cl_khr_fp64 | ||
| 2652 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2653 | #ifdef cl_khr_fp16 | ||
| 2654 | half __ovld __cnfn length(half p); | ||
| 2655 | half __ovld __cnfn length(half2 p); | ||
| 2656 | @@ -10524,12 +10537,12 @@ float __ovld __cnfn normalize(float p); | ||
| 2657 | float2 __ovld __cnfn normalize(float2 p); | ||
| 2658 | float3 __ovld __cnfn normalize(float3 p); | ||
| 2659 | float4 __ovld __cnfn normalize(float4 p); | ||
| 2660 | -#ifdef cl_khr_fp64 | ||
| 2661 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2662 | double __ovld __cnfn normalize(double p); | ||
| 2663 | double2 __ovld __cnfn normalize(double2 p); | ||
| 2664 | double3 __ovld __cnfn normalize(double3 p); | ||
| 2665 | double4 __ovld __cnfn normalize(double4 p); | ||
| 2666 | -#endif //cl_khr_fp64 | ||
| 2667 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2668 | #ifdef cl_khr_fp16 | ||
| 2669 | half __ovld __cnfn normalize(half p); | ||
| 2670 | half2 __ovld __cnfn normalize(half2 p); | ||
| 2671 | @@ -10610,14 +10623,14 @@ int3 __ovld __cnfn isequal(float3 x, float3 y); | ||
| 2672 | int4 __ovld __cnfn isequal(float4 x, float4 y); | ||
| 2673 | int8 __ovld __cnfn isequal(float8 x, float8 y); | ||
| 2674 | int16 __ovld __cnfn isequal(float16 x, float16 y); | ||
| 2675 | -#ifdef cl_khr_fp64 | ||
| 2676 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2677 | int __ovld __cnfn isequal(double x, double y); | ||
| 2678 | long2 __ovld __cnfn isequal(double2 x, double2 y); | ||
| 2679 | long3 __ovld __cnfn isequal(double3 x, double3 y); | ||
| 2680 | long4 __ovld __cnfn isequal(double4 x, double4 y); | ||
| 2681 | long8 __ovld __cnfn isequal(double8 x, double8 y); | ||
| 2682 | long16 __ovld __cnfn isequal(double16 x, double16 y); | ||
| 2683 | -#endif //cl_khr_fp64 | ||
| 2684 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2685 | #ifdef cl_khr_fp16 | ||
| 2686 | int __ovld __cnfn isequal(half x, half y); | ||
| 2687 | short2 __ovld __cnfn isequal(half2 x, half2 y); | ||
| 2688 | @@ -10636,14 +10649,14 @@ int3 __ovld __cnfn isnotequal(float3 x, float3 y); | ||
| 2689 | int4 __ovld __cnfn isnotequal(float4 x, float4 y); | ||
| 2690 | int8 __ovld __cnfn isnotequal(float8 x, float8 y); | ||
| 2691 | int16 __ovld __cnfn isnotequal(float16 x, float16 y); | ||
| 2692 | -#ifdef cl_khr_fp64 | ||
| 2693 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2694 | int __ovld __cnfn isnotequal(double x, double y); | ||
| 2695 | long2 __ovld __cnfn isnotequal(double2 x, double2 y); | ||
| 2696 | long3 __ovld __cnfn isnotequal(double3 x, double3 y); | ||
| 2697 | long4 __ovld __cnfn isnotequal(double4 x, double4 y); | ||
| 2698 | long8 __ovld __cnfn isnotequal(double8 x, double8 y); | ||
| 2699 | long16 __ovld __cnfn isnotequal(double16 x, double16 y); | ||
| 2700 | -#endif //cl_khr_fp64 | ||
| 2701 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2702 | #ifdef cl_khr_fp16 | ||
| 2703 | int __ovld __cnfn isnotequal(half x, half y); | ||
| 2704 | short2 __ovld __cnfn isnotequal(half2 x, half2 y); | ||
| 2705 | @@ -10662,14 +10675,14 @@ int3 __ovld __cnfn isgreater(float3 x, float3 y); | ||
| 2706 | int4 __ovld __cnfn isgreater(float4 x, float4 y); | ||
| 2707 | int8 __ovld __cnfn isgreater(float8 x, float8 y); | ||
| 2708 | int16 __ovld __cnfn isgreater(float16 x, float16 y); | ||
| 2709 | -#ifdef cl_khr_fp64 | ||
| 2710 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2711 | int __ovld __cnfn isgreater(double x, double y); | ||
| 2712 | long2 __ovld __cnfn isgreater(double2 x, double2 y); | ||
| 2713 | long3 __ovld __cnfn isgreater(double3 x, double3 y); | ||
| 2714 | long4 __ovld __cnfn isgreater(double4 x, double4 y); | ||
| 2715 | long8 __ovld __cnfn isgreater(double8 x, double8 y); | ||
| 2716 | long16 __ovld __cnfn isgreater(double16 x, double16 y); | ||
| 2717 | -#endif //cl_khr_fp64 | ||
| 2718 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2719 | #ifdef cl_khr_fp16 | ||
| 2720 | int __ovld __cnfn isgreater(half x, half y); | ||
| 2721 | short2 __ovld __cnfn isgreater(half2 x, half2 y); | ||
| 2722 | @@ -10688,14 +10701,14 @@ int3 __ovld __cnfn isgreaterequal(float3 x, float3 y); | ||
| 2723 | int4 __ovld __cnfn isgreaterequal(float4 x, float4 y); | ||
| 2724 | int8 __ovld __cnfn isgreaterequal(float8 x, float8 y); | ||
| 2725 | int16 __ovld __cnfn isgreaterequal(float16 x, float16 y); | ||
| 2726 | -#ifdef cl_khr_fp64 | ||
| 2727 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2728 | int __ovld __cnfn isgreaterequal(double x, double y); | ||
| 2729 | long2 __ovld __cnfn isgreaterequal(double2 x, double2 y); | ||
| 2730 | long3 __ovld __cnfn isgreaterequal(double3 x, double3 y); | ||
| 2731 | long4 __ovld __cnfn isgreaterequal(double4 x, double4 y); | ||
| 2732 | long8 __ovld __cnfn isgreaterequal(double8 x, double8 y); | ||
| 2733 | long16 __ovld __cnfn isgreaterequal(double16 x, double16 y); | ||
| 2734 | -#endif //cl_khr_fp64 | ||
| 2735 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2736 | #ifdef cl_khr_fp16 | ||
| 2737 | int __ovld __cnfn isgreaterequal(half x, half y); | ||
| 2738 | short2 __ovld __cnfn isgreaterequal(half2 x, half2 y); | ||
| 2739 | @@ -10714,14 +10727,14 @@ int3 __ovld __cnfn isless(float3 x, float3 y); | ||
| 2740 | int4 __ovld __cnfn isless(float4 x, float4 y); | ||
| 2741 | int8 __ovld __cnfn isless(float8 x, float8 y); | ||
| 2742 | int16 __ovld __cnfn isless(float16 x, float16 y); | ||
| 2743 | -#ifdef cl_khr_fp64 | ||
| 2744 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2745 | int __ovld __cnfn isless(double x, double y); | ||
| 2746 | long2 __ovld __cnfn isless(double2 x, double2 y); | ||
| 2747 | long3 __ovld __cnfn isless(double3 x, double3 y); | ||
| 2748 | long4 __ovld __cnfn isless(double4 x, double4 y); | ||
| 2749 | long8 __ovld __cnfn isless(double8 x, double8 y); | ||
| 2750 | long16 __ovld __cnfn isless(double16 x, double16 y); | ||
| 2751 | -#endif //cl_khr_fp64 | ||
| 2752 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2753 | #ifdef cl_khr_fp16 | ||
| 2754 | int __ovld __cnfn isless(half x, half y); | ||
| 2755 | short2 __ovld __cnfn isless(half2 x, half2 y); | ||
| 2756 | @@ -10740,14 +10753,14 @@ int3 __ovld __cnfn islessequal(float3 x, float3 y); | ||
| 2757 | int4 __ovld __cnfn islessequal(float4 x, float4 y); | ||
| 2758 | int8 __ovld __cnfn islessequal(float8 x, float8 y); | ||
| 2759 | int16 __ovld __cnfn islessequal(float16 x, float16 y); | ||
| 2760 | -#ifdef cl_khr_fp64 | ||
| 2761 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2762 | int __ovld __cnfn islessequal(double x, double y); | ||
| 2763 | long2 __ovld __cnfn islessequal(double2 x, double2 y); | ||
| 2764 | long3 __ovld __cnfn islessequal(double3 x, double3 y); | ||
| 2765 | long4 __ovld __cnfn islessequal(double4 x, double4 y); | ||
| 2766 | long8 __ovld __cnfn islessequal(double8 x, double8 y); | ||
| 2767 | long16 __ovld __cnfn islessequal(double16 x, double16 y); | ||
| 2768 | -#endif //cl_khr_fp64 | ||
| 2769 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2770 | #ifdef cl_khr_fp16 | ||
| 2771 | int __ovld __cnfn islessequal(half x, half y); | ||
| 2772 | short2 __ovld __cnfn islessequal(half2 x, half2 y); | ||
| 2773 | @@ -10767,14 +10780,14 @@ int3 __ovld __cnfn islessgreater(float3 x, float3 y); | ||
| 2774 | int4 __ovld __cnfn islessgreater(float4 x, float4 y); | ||
| 2775 | int8 __ovld __cnfn islessgreater(float8 x, float8 y); | ||
| 2776 | int16 __ovld __cnfn islessgreater(float16 x, float16 y); | ||
| 2777 | -#ifdef cl_khr_fp64 | ||
| 2778 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2779 | int __ovld __cnfn islessgreater(double x, double y); | ||
| 2780 | long2 __ovld __cnfn islessgreater(double2 x, double2 y); | ||
| 2781 | long3 __ovld __cnfn islessgreater(double3 x, double3 y); | ||
| 2782 | long4 __ovld __cnfn islessgreater(double4 x, double4 y); | ||
| 2783 | long8 __ovld __cnfn islessgreater(double8 x, double8 y); | ||
| 2784 | long16 __ovld __cnfn islessgreater(double16 x, double16 y); | ||
| 2785 | -#endif //cl_khr_fp64 | ||
| 2786 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2787 | #ifdef cl_khr_fp16 | ||
| 2788 | int __ovld __cnfn islessgreater(half x, half y); | ||
| 2789 | short2 __ovld __cnfn islessgreater(half2 x, half2 y); | ||
| 2790 | @@ -10793,14 +10806,14 @@ int3 __ovld __cnfn isfinite(float3); | ||
| 2791 | int4 __ovld __cnfn isfinite(float4); | ||
| 2792 | int8 __ovld __cnfn isfinite(float8); | ||
| 2793 | int16 __ovld __cnfn isfinite(float16); | ||
| 2794 | -#ifdef cl_khr_fp64 | ||
| 2795 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2796 | int __ovld __cnfn isfinite(double); | ||
| 2797 | long2 __ovld __cnfn isfinite(double2); | ||
| 2798 | long3 __ovld __cnfn isfinite(double3); | ||
| 2799 | long4 __ovld __cnfn isfinite(double4); | ||
| 2800 | long8 __ovld __cnfn isfinite(double8); | ||
| 2801 | long16 __ovld __cnfn isfinite(double16); | ||
| 2802 | -#endif //cl_khr_fp64 | ||
| 2803 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2804 | #ifdef cl_khr_fp16 | ||
| 2805 | int __ovld __cnfn isfinite(half); | ||
| 2806 | short2 __ovld __cnfn isfinite(half2); | ||
| 2807 | @@ -10819,14 +10832,14 @@ int3 __ovld __cnfn isinf(float3); | ||
| 2808 | int4 __ovld __cnfn isinf(float4); | ||
| 2809 | int8 __ovld __cnfn isinf(float8); | ||
| 2810 | int16 __ovld __cnfn isinf(float16); | ||
| 2811 | -#ifdef cl_khr_fp64 | ||
| 2812 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2813 | int __ovld __cnfn isinf(double); | ||
| 2814 | long2 __ovld __cnfn isinf(double2); | ||
| 2815 | long3 __ovld __cnfn isinf(double3); | ||
| 2816 | long4 __ovld __cnfn isinf(double4); | ||
| 2817 | long8 __ovld __cnfn isinf(double8); | ||
| 2818 | long16 __ovld __cnfn isinf(double16); | ||
| 2819 | -#endif //cl_khr_fp64 | ||
| 2820 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2821 | #ifdef cl_khr_fp16 | ||
| 2822 | int __ovld __cnfn isinf(half); | ||
| 2823 | short2 __ovld __cnfn isinf(half2); | ||
| 2824 | @@ -10845,14 +10858,14 @@ int3 __ovld __cnfn isnan(float3); | ||
| 2825 | int4 __ovld __cnfn isnan(float4); | ||
| 2826 | int8 __ovld __cnfn isnan(float8); | ||
| 2827 | int16 __ovld __cnfn isnan(float16); | ||
| 2828 | -#ifdef cl_khr_fp64 | ||
| 2829 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2830 | int __ovld __cnfn isnan(double); | ||
| 2831 | long2 __ovld __cnfn isnan(double2); | ||
| 2832 | long3 __ovld __cnfn isnan(double3); | ||
| 2833 | long4 __ovld __cnfn isnan(double4); | ||
| 2834 | long8 __ovld __cnfn isnan(double8); | ||
| 2835 | long16 __ovld __cnfn isnan(double16); | ||
| 2836 | -#endif //cl_khr_fp64 | ||
| 2837 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2838 | #ifdef cl_khr_fp16 | ||
| 2839 | int __ovld __cnfn isnan(half); | ||
| 2840 | short2 __ovld __cnfn isnan(half2); | ||
| 2841 | @@ -10871,14 +10884,14 @@ int3 __ovld __cnfn isnormal(float3); | ||
| 2842 | int4 __ovld __cnfn isnormal(float4); | ||
| 2843 | int8 __ovld __cnfn isnormal(float8); | ||
| 2844 | int16 __ovld __cnfn isnormal(float16); | ||
| 2845 | -#ifdef cl_khr_fp64 | ||
| 2846 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2847 | int __ovld __cnfn isnormal(double); | ||
| 2848 | long2 __ovld __cnfn isnormal(double2); | ||
| 2849 | long3 __ovld __cnfn isnormal(double3); | ||
| 2850 | long4 __ovld __cnfn isnormal(double4); | ||
| 2851 | long8 __ovld __cnfn isnormal(double8); | ||
| 2852 | long16 __ovld __cnfn isnormal(double16); | ||
| 2853 | -#endif //cl_khr_fp64 | ||
| 2854 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2855 | #ifdef cl_khr_fp16 | ||
| 2856 | int __ovld __cnfn isnormal(half); | ||
| 2857 | short2 __ovld __cnfn isnormal(half2); | ||
| 2858 | @@ -10899,14 +10912,14 @@ int3 __ovld __cnfn isordered(float3 x, float3 y); | ||
| 2859 | int4 __ovld __cnfn isordered(float4 x, float4 y); | ||
| 2860 | int8 __ovld __cnfn isordered(float8 x, float8 y); | ||
| 2861 | int16 __ovld __cnfn isordered(float16 x, float16 y); | ||
| 2862 | -#ifdef cl_khr_fp64 | ||
| 2863 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2864 | int __ovld __cnfn isordered(double x, double y); | ||
| 2865 | long2 __ovld __cnfn isordered(double2 x, double2 y); | ||
| 2866 | long3 __ovld __cnfn isordered(double3 x, double3 y); | ||
| 2867 | long4 __ovld __cnfn isordered(double4 x, double4 y); | ||
| 2868 | long8 __ovld __cnfn isordered(double8 x, double8 y); | ||
| 2869 | long16 __ovld __cnfn isordered(double16 x, double16 y); | ||
| 2870 | -#endif //cl_khr_fp64 | ||
| 2871 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2872 | #ifdef cl_khr_fp16 | ||
| 2873 | int __ovld __cnfn isordered(half x, half y); | ||
| 2874 | short2 __ovld __cnfn isordered(half2 x, half2 y); | ||
| 2875 | @@ -10927,14 +10940,14 @@ int3 __ovld __cnfn isunordered(float3 x, float3 y); | ||
| 2876 | int4 __ovld __cnfn isunordered(float4 x, float4 y); | ||
| 2877 | int8 __ovld __cnfn isunordered(float8 x, float8 y); | ||
| 2878 | int16 __ovld __cnfn isunordered(float16 x, float16 y); | ||
| 2879 | -#ifdef cl_khr_fp64 | ||
| 2880 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2881 | int __ovld __cnfn isunordered(double x, double y); | ||
| 2882 | long2 __ovld __cnfn isunordered(double2 x, double2 y); | ||
| 2883 | long3 __ovld __cnfn isunordered(double3 x, double3 y); | ||
| 2884 | long4 __ovld __cnfn isunordered(double4 x, double4 y); | ||
| 2885 | long8 __ovld __cnfn isunordered(double8 x, double8 y); | ||
| 2886 | long16 __ovld __cnfn isunordered(double16 x, double16 y); | ||
| 2887 | -#endif //cl_khr_fp64 | ||
| 2888 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2889 | #ifdef cl_khr_fp16 | ||
| 2890 | int __ovld __cnfn isunordered(half x, half y); | ||
| 2891 | short2 __ovld __cnfn isunordered(half2 x, half2 y); | ||
| 2892 | @@ -10957,14 +10970,14 @@ int3 __ovld __cnfn signbit(float3); | ||
| 2893 | int4 __ovld __cnfn signbit(float4); | ||
| 2894 | int8 __ovld __cnfn signbit(float8); | ||
| 2895 | int16 __ovld __cnfn signbit(float16); | ||
| 2896 | -#ifdef cl_khr_fp64 | ||
| 2897 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2898 | int __ovld __cnfn signbit(double); | ||
| 2899 | long2 __ovld __cnfn signbit(double2); | ||
| 2900 | long3 __ovld __cnfn signbit(double3); | ||
| 2901 | long4 __ovld __cnfn signbit(double4); | ||
| 2902 | long8 __ovld __cnfn signbit(double8); | ||
| 2903 | long16 __ovld __cnfn signbit(double16); | ||
| 2904 | -#endif //cl_khr_fp64 | ||
| 2905 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2906 | #ifdef cl_khr_fp16 | ||
| 2907 | int __ovld __cnfn signbit(half); | ||
| 2908 | short2 __ovld __cnfn signbit(half2); | ||
| 2909 | @@ -11091,14 +11104,14 @@ float3 __ovld __cnfn bitselect(float3 a, float3 b, float3 c); | ||
| 2910 | float4 __ovld __cnfn bitselect(float4 a, float4 b, float4 c); | ||
| 2911 | float8 __ovld __cnfn bitselect(float8 a, float8 b, float8 c); | ||
| 2912 | float16 __ovld __cnfn bitselect(float16 a, float16 b, float16 c); | ||
| 2913 | -#ifdef cl_khr_fp64 | ||
| 2914 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2915 | double __ovld __cnfn bitselect(double a, double b, double c); | ||
| 2916 | double2 __ovld __cnfn bitselect(double2 a, double2 b, double2 c); | ||
| 2917 | double3 __ovld __cnfn bitselect(double3 a, double3 b, double3 c); | ||
| 2918 | double4 __ovld __cnfn bitselect(double4 a, double4 b, double4 c); | ||
| 2919 | double8 __ovld __cnfn bitselect(double8 a, double8 b, double8 c); | ||
| 2920 | double16 __ovld __cnfn bitselect(double16 a, double16 b, double16 c); | ||
| 2921 | -#endif //cl_khr_fp64 | ||
| 2922 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2923 | #ifdef cl_khr_fp16 | ||
| 2924 | half __ovld __cnfn bitselect(half a, half b, half c); | ||
| 2925 | half2 __ovld __cnfn bitselect(half2 a, half2 b, half2 c); | ||
| 2926 | @@ -11231,7 +11244,7 @@ ulong8 __ovld __cnfn select(ulong8 a, ulong8 b, ulong8 c); | ||
| 2927 | long16 __ovld __cnfn select(long16 a, long16 b, ulong16 c); | ||
| 2928 | ulong16 __ovld __cnfn select(ulong16 a, ulong16 b, ulong16 c); | ||
| 2929 | |||
| 2930 | -#ifdef cl_khr_fp64 | ||
| 2931 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2932 | double __ovld __cnfn select(double a, double b, long c); | ||
| 2933 | double2 __ovld __cnfn select(double2 a, double2 b, long2 c); | ||
| 2934 | double3 __ovld __cnfn select(double3 a, double3 b, long3 c); | ||
| 2935 | @@ -11244,7 +11257,7 @@ double3 __ovld __cnfn select(double3 a, double3 b, ulong3 c); | ||
| 2936 | double4 __ovld __cnfn select(double4 a, double4 b, ulong4 c); | ||
| 2937 | double8 __ovld __cnfn select(double8 a, double8 b, ulong8 c); | ||
| 2938 | double16 __ovld __cnfn select(double16 a, double16 b, ulong16 c); | ||
| 2939 | -#endif //cl_khr_fp64 | ||
| 2940 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2941 | #ifdef cl_khr_fp16 | ||
| 2942 | half __ovld __cnfn select(half a, half b, short c); | ||
| 2943 | half2 __ovld __cnfn select(half2 a, half2 b, short2 c); | ||
| 2944 | @@ -11323,13 +11336,13 @@ uint16 __ovld vload16(size_t offset, const __constant uint *p); | ||
| 2945 | long16 __ovld vload16(size_t offset, const __constant long *p); | ||
| 2946 | ulong16 __ovld vload16(size_t offset, const __constant ulong *p); | ||
| 2947 | float16 __ovld vload16(size_t offset, const __constant float *p); | ||
| 2948 | -#ifdef cl_khr_fp64 | ||
| 2949 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2950 | double2 __ovld vload2(size_t offset, const __constant double *p); | ||
| 2951 | double3 __ovld vload3(size_t offset, const __constant double *p); | ||
| 2952 | double4 __ovld vload4(size_t offset, const __constant double *p); | ||
| 2953 | double8 __ovld vload8(size_t offset, const __constant double *p); | ||
| 2954 | double16 __ovld vload16(size_t offset, const __constant double *p); | ||
| 2955 | -#endif //cl_khr_fp64 | ||
| 2956 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2957 | |||
| 2958 | #ifdef cl_khr_fp16 | ||
| 2959 | half __ovld vload(size_t offset, const __constant half *p); | ||
| 2960 | @@ -11340,7 +11353,7 @@ half8 __ovld vload8(size_t offset, const __constant half *p); | ||
| 2961 | half16 __ovld vload16(size_t offset, const __constant half *p); | ||
| 2962 | #endif //cl_khr_fp16 | ||
| 2963 | |||
| 2964 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 2965 | +#ifdef __opencl_c_generic_address_space | ||
| 2966 | char2 __ovld vload2(size_t offset, const char *p); | ||
| 2967 | uchar2 __ovld vload2(size_t offset, const uchar *p); | ||
| 2968 | short2 __ovld vload2(size_t offset, const short *p); | ||
| 2969 | @@ -11387,13 +11400,13 @@ long16 __ovld vload16(size_t offset, const long *p); | ||
| 2970 | ulong16 __ovld vload16(size_t offset, const ulong *p); | ||
| 2971 | float16 __ovld vload16(size_t offset, const float *p); | ||
| 2972 | |||
| 2973 | -#ifdef cl_khr_fp64 | ||
| 2974 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2975 | double2 __ovld vload2(size_t offset, const double *p); | ||
| 2976 | double3 __ovld vload3(size_t offset, const double *p); | ||
| 2977 | double4 __ovld vload4(size_t offset, const double *p); | ||
| 2978 | double8 __ovld vload8(size_t offset, const double *p); | ||
| 2979 | double16 __ovld vload16(size_t offset, const double *p); | ||
| 2980 | -#endif //cl_khr_fp64 | ||
| 2981 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 2982 | |||
| 2983 | #ifdef cl_khr_fp16 | ||
| 2984 | half __ovld vload(size_t offset, const half *p); | ||
| 2985 | @@ -11403,7 +11416,7 @@ half4 __ovld vload4(size_t offset, const half *p); | ||
| 2986 | half8 __ovld vload8(size_t offset, const half *p); | ||
| 2987 | half16 __ovld vload16(size_t offset, const half *p); | ||
| 2988 | #endif //cl_khr_fp16 | ||
| 2989 | -#else | ||
| 2990 | +#endif //__opencl_c_generic_address_space | ||
| 2991 | char2 __ovld vload2(size_t offset, const __global char *p); | ||
| 2992 | uchar2 __ovld vload2(size_t offset, const __global uchar *p); | ||
| 2993 | short2 __ovld vload2(size_t offset, const __global short *p); | ||
| 2994 | @@ -11540,7 +11553,7 @@ long16 __ovld vload16(size_t offset, const __private long *p); | ||
| 2995 | ulong16 __ovld vload16(size_t offset, const __private ulong *p); | ||
| 2996 | float16 __ovld vload16(size_t offset, const __private float *p); | ||
| 2997 | |||
| 2998 | -#ifdef cl_khr_fp64 | ||
| 2999 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3000 | double2 __ovld vload2(size_t offset, const __global double *p); | ||
| 3001 | double3 __ovld vload3(size_t offset, const __global double *p); | ||
| 3002 | double4 __ovld vload4(size_t offset, const __global double *p); | ||
| 3003 | @@ -11556,7 +11569,7 @@ double3 __ovld vload3(size_t offset, const __private double *p); | ||
| 3004 | double4 __ovld vload4(size_t offset, const __private double *p); | ||
| 3005 | double8 __ovld vload8(size_t offset, const __private double *p); | ||
| 3006 | double16 __ovld vload16(size_t offset, const __private double *p); | ||
| 3007 | -#endif //cl_khr_fp64 | ||
| 3008 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3009 | |||
| 3010 | #ifdef cl_khr_fp16 | ||
| 3011 | half __ovld vload(size_t offset, const __global half *p); | ||
| 3012 | @@ -11578,9 +11591,8 @@ half4 __ovld vload4(size_t offset, const __private half *p); | ||
| 3013 | half8 __ovld vload8(size_t offset, const __private half *p); | ||
| 3014 | half16 __ovld vload16(size_t offset, const __private half *p); | ||
| 3015 | #endif //cl_khr_fp16 | ||
| 3016 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3017 | |||
| 3018 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3019 | +#ifdef __opencl_c_generic_address_space | ||
| 3020 | void __ovld vstore2(char2 data, size_t offset, char *p); | ||
| 3021 | void __ovld vstore2(uchar2 data, size_t offset, uchar *p); | ||
| 3022 | void __ovld vstore2(short2 data, size_t offset, short *p); | ||
| 3023 | @@ -11626,13 +11638,13 @@ void __ovld vstore16(uint16 data, size_t offset, uint *p); | ||
| 3024 | void __ovld vstore16(long16 data, size_t offset, long *p); | ||
| 3025 | void __ovld vstore16(ulong16 data, size_t offset, ulong *p); | ||
| 3026 | void __ovld vstore16(float16 data, size_t offset, float *p); | ||
| 3027 | -#ifdef cl_khr_fp64 | ||
| 3028 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3029 | void __ovld vstore2(double2 data, size_t offset, double *p); | ||
| 3030 | void __ovld vstore3(double3 data, size_t offset, double *p); | ||
| 3031 | void __ovld vstore4(double4 data, size_t offset, double *p); | ||
| 3032 | void __ovld vstore8(double8 data, size_t offset, double *p); | ||
| 3033 | void __ovld vstore16(double16 data, size_t offset, double *p); | ||
| 3034 | -#endif //cl_khr_fp64 | ||
| 3035 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3036 | #ifdef cl_khr_fp16 | ||
| 3037 | void __ovld vstore(half data, size_t offset, half *p); | ||
| 3038 | void __ovld vstore2(half2 data, size_t offset, half *p); | ||
| 3039 | @@ -11641,7 +11653,7 @@ void __ovld vstore4(half4 data, size_t offset, half *p); | ||
| 3040 | void __ovld vstore8(half8 data, size_t offset, half *p); | ||
| 3041 | void __ovld vstore16(half16 data, size_t offset, half *p); | ||
| 3042 | #endif //cl_khr_fp16 | ||
| 3043 | -#else | ||
| 3044 | +#endif //__opencl_c_generic_address_space | ||
| 3045 | void __ovld vstore2(char2 data, size_t offset, __global char *p); | ||
| 3046 | void __ovld vstore2(uchar2 data, size_t offset, __global uchar *p); | ||
| 3047 | void __ovld vstore2(short2 data, size_t offset, __global short *p); | ||
| 3048 | @@ -11777,7 +11789,7 @@ void __ovld vstore16(uint16 data, size_t offset, __private uint *p); | ||
| 3049 | void __ovld vstore16(long16 data, size_t offset, __private long *p); | ||
| 3050 | void __ovld vstore16(ulong16 data, size_t offset, __private ulong *p); | ||
| 3051 | void __ovld vstore16(float16 data, size_t offset, __private float *p); | ||
| 3052 | -#ifdef cl_khr_fp64 | ||
| 3053 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3054 | void __ovld vstore2(double2 data, size_t offset, __global double *p); | ||
| 3055 | void __ovld vstore3(double3 data, size_t offset, __global double *p); | ||
| 3056 | void __ovld vstore4(double4 data, size_t offset, __global double *p); | ||
| 3057 | @@ -11793,7 +11805,7 @@ void __ovld vstore3(double3 data, size_t offset, __private double *p); | ||
| 3058 | void __ovld vstore4(double4 data, size_t offset, __private double *p); | ||
| 3059 | void __ovld vstore8(double8 data, size_t offset, __private double *p); | ||
| 3060 | void __ovld vstore16(double16 data, size_t offset, __private double *p); | ||
| 3061 | -#endif //cl_khr_fp64 | ||
| 3062 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3063 | #ifdef cl_khr_fp16 | ||
| 3064 | void __ovld vstore(half data, size_t offset, __global half *p); | ||
| 3065 | void __ovld vstore2(half2 data, size_t offset, __global half *p); | ||
| 3066 | @@ -11814,7 +11826,6 @@ void __ovld vstore4(half4 data, size_t offset, __private half *p); | ||
| 3067 | void __ovld vstore8(half8 data, size_t offset, __private half *p); | ||
| 3068 | void __ovld vstore16(half16 data, size_t offset, __private half *p); | ||
| 3069 | #endif //cl_khr_fp16 | ||
| 3070 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3071 | |||
| 3072 | /** | ||
| 3073 | * Read sizeof (half) bytes of data from address | ||
| 3074 | @@ -11825,13 +11836,12 @@ void __ovld vstore16(half16 data, size_t offset, __private half *p); | ||
| 3075 | * must be 16-bit aligned. | ||
| 3076 | */ | ||
| 3077 | float __ovld vload_half(size_t offset, const __constant half *p); | ||
| 3078 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3079 | +#ifdef __opencl_c_generic_address_space | ||
| 3080 | float __ovld vload_half(size_t offset, const half *p); | ||
| 3081 | -#else | ||
| 3082 | +#endif //__opencl_c_generic_address_space | ||
| 3083 | float __ovld vload_half(size_t offset, const __global half *p); | ||
| 3084 | float __ovld vload_half(size_t offset, const __local half *p); | ||
| 3085 | float __ovld vload_half(size_t offset, const __private half *p); | ||
| 3086 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3087 | |||
| 3088 | /** | ||
| 3089 | * Read sizeof (halfn) bytes of data from address | ||
| 3090 | @@ -11846,13 +11856,13 @@ float3 __ovld vload_half3(size_t offset, const __constant half *p); | ||
| 3091 | float4 __ovld vload_half4(size_t offset, const __constant half *p); | ||
| 3092 | float8 __ovld vload_half8(size_t offset, const __constant half *p); | ||
| 3093 | float16 __ovld vload_half16(size_t offset, const __constant half *p); | ||
| 3094 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3095 | +#ifdef __opencl_c_generic_address_space | ||
| 3096 | float2 __ovld vload_half2(size_t offset, const half *p); | ||
| 3097 | float3 __ovld vload_half3(size_t offset, const half *p); | ||
| 3098 | float4 __ovld vload_half4(size_t offset, const half *p); | ||
| 3099 | float8 __ovld vload_half8(size_t offset, const half *p); | ||
| 3100 | float16 __ovld vload_half16(size_t offset, const half *p); | ||
| 3101 | -#else | ||
| 3102 | +#endif //__opencl_c_generic_address_space | ||
| 3103 | float2 __ovld vload_half2(size_t offset, const __global half *p); | ||
| 3104 | float3 __ovld vload_half3(size_t offset, const __global half *p); | ||
| 3105 | float4 __ovld vload_half4(size_t offset, const __global half *p); | ||
| 3106 | @@ -11868,7 +11878,6 @@ float3 __ovld vload_half3(size_t offset, const __private half *p); | ||
| 3107 | float4 __ovld vload_half4(size_t offset, const __private half *p); | ||
| 3108 | float8 __ovld vload_half8(size_t offset, const __private half *p); | ||
| 3109 | float16 __ovld vload_half16(size_t offset, const __private half *p); | ||
| 3110 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3111 | |||
| 3112 | /** | ||
| 3113 | * The float value given by data is first | ||
| 3114 | @@ -11881,20 +11890,20 @@ float16 __ovld vload_half16(size_t offset, const __private half *p); | ||
| 3115 | * The default current rounding mode is round to | ||
| 3116 | * nearest even. | ||
| 3117 | */ | ||
| 3118 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3119 | +#ifdef __opencl_c_generic_address_space | ||
| 3120 | void __ovld vstore_half(float data, size_t offset, half *p); | ||
| 3121 | void __ovld vstore_half_rte(float data, size_t offset, half *p); | ||
| 3122 | void __ovld vstore_half_rtz(float data, size_t offset, half *p); | ||
| 3123 | void __ovld vstore_half_rtp(float data, size_t offset, half *p); | ||
| 3124 | void __ovld vstore_half_rtn(float data, size_t offset, half *p); | ||
| 3125 | -#ifdef cl_khr_fp64 | ||
| 3126 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3127 | void __ovld vstore_half(double data, size_t offset, half *p); | ||
| 3128 | void __ovld vstore_half_rte(double data, size_t offset, half *p); | ||
| 3129 | void __ovld vstore_half_rtz(double data, size_t offset, half *p); | ||
| 3130 | void __ovld vstore_half_rtp(double data, size_t offset, half *p); | ||
| 3131 | void __ovld vstore_half_rtn(double data, size_t offset, half *p); | ||
| 3132 | -#endif //cl_khr_fp64 | ||
| 3133 | -#else | ||
| 3134 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3135 | +#endif //__opencl_c_generic_address_space | ||
| 3136 | void __ovld vstore_half(float data, size_t offset, __global half *p); | ||
| 3137 | void __ovld vstore_half_rte(float data, size_t offset, __global half *p); | ||
| 3138 | void __ovld vstore_half_rtz(float data, size_t offset, __global half *p); | ||
| 3139 | @@ -11910,7 +11919,7 @@ void __ovld vstore_half_rte(float data, size_t offset, __private half *p); | ||
| 3140 | void __ovld vstore_half_rtz(float data, size_t offset, __private half *p); | ||
| 3141 | void __ovld vstore_half_rtp(float data, size_t offset, __private half *p); | ||
| 3142 | void __ovld vstore_half_rtn(float data, size_t offset, __private half *p); | ||
| 3143 | -#ifdef cl_khr_fp64 | ||
| 3144 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3145 | void __ovld vstore_half(double data, size_t offset, __global half *p); | ||
| 3146 | void __ovld vstore_half_rte(double data, size_t offset, __global half *p); | ||
| 3147 | void __ovld vstore_half_rtz(double data, size_t offset, __global half *p); | ||
| 3148 | @@ -11926,8 +11935,7 @@ void __ovld vstore_half_rte(double data, size_t offset, __private half *p); | ||
| 3149 | void __ovld vstore_half_rtz(double data, size_t offset, __private half *p); | ||
| 3150 | void __ovld vstore_half_rtp(double data, size_t offset, __private half *p); | ||
| 3151 | void __ovld vstore_half_rtn(double data, size_t offset, __private half *p); | ||
| 3152 | -#endif //cl_khr_fp64 | ||
| 3153 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3154 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3155 | |||
| 3156 | /** | ||
| 3157 | * The floatn value given by data is converted to | ||
| 3158 | @@ -11940,7 +11948,7 @@ void __ovld vstore_half_rtn(double data, size_t offset, __private half *p); | ||
| 3159 | * The default current rounding mode is round to | ||
| 3160 | * nearest even. | ||
| 3161 | */ | ||
| 3162 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3163 | +#ifdef __opencl_c_generic_address_space | ||
| 3164 | void __ovld vstore_half2(float2 data, size_t offset, half *p); | ||
| 3165 | void __ovld vstore_half3(float3 data, size_t offset, half *p); | ||
| 3166 | void __ovld vstore_half4(float4 data, size_t offset, half *p); | ||
| 3167 | @@ -11966,7 +11974,7 @@ void __ovld vstore_half3_rtn(float3 data, size_t offset, half *p); | ||
| 3168 | void __ovld vstore_half4_rtn(float4 data, size_t offset, half *p); | ||
| 3169 | void __ovld vstore_half8_rtn(float8 data, size_t offset, half *p); | ||
| 3170 | void __ovld vstore_half16_rtn(float16 data, size_t offset, half *p); | ||
| 3171 | -#ifdef cl_khr_fp64 | ||
| 3172 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3173 | void __ovld vstore_half2(double2 data, size_t offset, half *p); | ||
| 3174 | void __ovld vstore_half3(double3 data, size_t offset, half *p); | ||
| 3175 | void __ovld vstore_half4(double4 data, size_t offset, half *p); | ||
| 3176 | @@ -11992,8 +12000,8 @@ void __ovld vstore_half3_rtn(double3 data, size_t offset, half *p); | ||
| 3177 | void __ovld vstore_half4_rtn(double4 data, size_t offset, half *p); | ||
| 3178 | void __ovld vstore_half8_rtn(double8 data, size_t offset, half *p); | ||
| 3179 | void __ovld vstore_half16_rtn(double16 data, size_t offset, half *p); | ||
| 3180 | -#endif //cl_khr_fp64 | ||
| 3181 | -#else | ||
| 3182 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3183 | +#endif //__opencl_c_generic_address_space | ||
| 3184 | void __ovld vstore_half2(float2 data, size_t offset, __global half *p); | ||
| 3185 | void __ovld vstore_half3(float3 data, size_t offset, __global half *p); | ||
| 3186 | void __ovld vstore_half4(float4 data, size_t offset, __global half *p); | ||
| 3187 | @@ -12069,7 +12077,7 @@ void __ovld vstore_half3_rtn(float3 data, size_t offset, __private half *p); | ||
| 3188 | void __ovld vstore_half4_rtn(float4 data, size_t offset, __private half *p); | ||
| 3189 | void __ovld vstore_half8_rtn(float8 data, size_t offset, __private half *p); | ||
| 3190 | void __ovld vstore_half16_rtn(float16 data, size_t offset, __private half *p); | ||
| 3191 | -#ifdef cl_khr_fp64 | ||
| 3192 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3193 | void __ovld vstore_half2(double2 data, size_t offset, __global half *p); | ||
| 3194 | void __ovld vstore_half3(double3 data, size_t offset, __global half *p); | ||
| 3195 | void __ovld vstore_half4(double4 data, size_t offset, __global half *p); | ||
| 3196 | @@ -12145,8 +12153,7 @@ void __ovld vstore_half3_rtn(double3 data, size_t offset, __private half *p); | ||
| 3197 | void __ovld vstore_half4_rtn(double4 data, size_t offset, __private half *p); | ||
| 3198 | void __ovld vstore_half8_rtn(double8 data, size_t offset, __private half *p); | ||
| 3199 | void __ovld vstore_half16_rtn(double16 data, size_t offset, __private half *p); | ||
| 3200 | -#endif //cl_khr_fp64 | ||
| 3201 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3202 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3203 | |||
| 3204 | /** | ||
| 3205 | * For n = 1, 2, 4, 8 and 16 read sizeof (halfn) | ||
| 3206 | @@ -12167,14 +12174,14 @@ float3 __ovld vloada_half3(size_t offset, const __constant half *p); | ||
| 3207 | float4 __ovld vloada_half4(size_t offset, const __constant half *p); | ||
| 3208 | float8 __ovld vloada_half8(size_t offset, const __constant half *p); | ||
| 3209 | float16 __ovld vloada_half16(size_t offset, const __constant half *p); | ||
| 3210 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3211 | +#ifdef __opencl_c_generic_address_space | ||
| 3212 | float __ovld vloada_half(size_t offset, const half *p); | ||
| 3213 | float2 __ovld vloada_half2(size_t offset, const half *p); | ||
| 3214 | float3 __ovld vloada_half3(size_t offset, const half *p); | ||
| 3215 | float4 __ovld vloada_half4(size_t offset, const half *p); | ||
| 3216 | float8 __ovld vloada_half8(size_t offset, const half *p); | ||
| 3217 | float16 __ovld vloada_half16(size_t offset, const half *p); | ||
| 3218 | -#else | ||
| 3219 | +#endif //__opencl_c_generic_address_space | ||
| 3220 | float __ovld vloada_half(size_t offset, const __global half *p); | ||
| 3221 | float2 __ovld vloada_half2(size_t offset, const __global half *p); | ||
| 3222 | float3 __ovld vloada_half3(size_t offset, const __global half *p); | ||
| 3223 | @@ -12193,7 +12200,6 @@ float3 __ovld vloada_half3(size_t offset, const __private half *p); | ||
| 3224 | float4 __ovld vloada_half4(size_t offset, const __private half *p); | ||
| 3225 | float8 __ovld vloada_half8(size_t offset, const __private half *p); | ||
| 3226 | float16 __ovld vloada_half16(size_t offset, const __private half *p); | ||
| 3227 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3228 | |||
| 3229 | /** | ||
| 3230 | * The floatn value given by data is converted to | ||
| 3231 | @@ -12211,7 +12217,7 @@ float16 __ovld vloada_half16(size_t offset, const __private half *p); | ||
| 3232 | * mode. The default current rounding mode is | ||
| 3233 | * round to nearest even. | ||
| 3234 | */ | ||
| 3235 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3236 | +#ifdef __opencl_c_generic_address_space | ||
| 3237 | void __ovld vstorea_half(float data, size_t offset, half *p); | ||
| 3238 | void __ovld vstorea_half2(float2 data, size_t offset, half *p); | ||
| 3239 | void __ovld vstorea_half3(float3 data, size_t offset, half *p); | ||
| 3240 | @@ -12247,7 +12253,7 @@ void __ovld vstorea_half4_rtn(float4 data, size_t offset, half *p); | ||
| 3241 | void __ovld vstorea_half8_rtn(float8 data, size_t offset, half *p); | ||
| 3242 | void __ovld vstorea_half16_rtn(float16 data, size_t offset, half *p); | ||
| 3243 | |||
| 3244 | -#ifdef cl_khr_fp64 | ||
| 3245 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3246 | void __ovld vstorea_half(double data, size_t offset, half *p); | ||
| 3247 | void __ovld vstorea_half2(double2 data, size_t offset, half *p); | ||
| 3248 | void __ovld vstorea_half3(double3 data, size_t offset, half *p); | ||
| 3249 | @@ -12282,9 +12288,9 @@ void __ovld vstorea_half3_rtn(double3 data, size_t offset, half *p); | ||
| 3250 | void __ovld vstorea_half4_rtn(double4 data, size_t offset, half *p); | ||
| 3251 | void __ovld vstorea_half8_rtn(double8 data, size_t offset, half *p); | ||
| 3252 | void __ovld vstorea_half16_rtn(double16 data, size_t offset, half *p); | ||
| 3253 | -#endif //cl_khr_fp64 | ||
| 3254 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3255 | +#endif //__opencl_c_generic_address_space | ||
| 3256 | |||
| 3257 | -#else | ||
| 3258 | void __ovld vstorea_half(float data, size_t offset, __global half *p); | ||
| 3259 | void __ovld vstorea_half2(float2 data, size_t offset, __global half *p); | ||
| 3260 | void __ovld vstorea_half3(float3 data, size_t offset, __global half *p); | ||
| 3261 | @@ -12390,7 +12396,7 @@ void __ovld vstorea_half4_rtn(float4 data, size_t offset, __private half *p); | ||
| 3262 | void __ovld vstorea_half8_rtn(float8 data, size_t offset, __private half *p); | ||
| 3263 | void __ovld vstorea_half16_rtn(float16 data, size_t offset, __private half *p); | ||
| 3264 | |||
| 3265 | -#ifdef cl_khr_fp64 | ||
| 3266 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3267 | void __ovld vstorea_half(double data, size_t offset, __global half *p); | ||
| 3268 | void __ovld vstorea_half2(double2 data, size_t offset, __global half *p); | ||
| 3269 | void __ovld vstorea_half3(double3 data, size_t offset, __global half *p); | ||
| 3270 | @@ -12495,8 +12501,7 @@ void __ovld vstorea_half3_rtn(double3 data,size_t offset, __private half *p); | ||
| 3271 | void __ovld vstorea_half4_rtn(double4 data,size_t offset, __private half *p); | ||
| 3272 | void __ovld vstorea_half8_rtn(double8 data,size_t offset, __private half *p); | ||
| 3273 | void __ovld vstorea_half16_rtn(double16 data,size_t offset, __private half *p); | ||
| 3274 | -#endif //cl_khr_fp64 | ||
| 3275 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3276 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3277 | |||
| 3278 | // OpenCL v1.1 s6.11.8, v1.2 s6.12.8, v2.0 s6.13.8 - Synchronization Functions | ||
| 3279 | |||
| 3280 | @@ -12580,7 +12585,7 @@ void __ovld write_mem_fence(cl_mem_fence_flags flags); | ||
| 3281 | |||
| 3282 | // OpenCL v2.0 s6.13.9 - Address Space Qualifier Functions | ||
| 3283 | |||
| 3284 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3285 | +#ifdef __opencl_c_generic_address_space | ||
| 3286 | cl_mem_fence_flags __ovld get_fence(const void *ptr); | ||
| 3287 | cl_mem_fence_flags __ovld get_fence(void *ptr); | ||
| 3288 | |||
| 3289 | @@ -12591,7 +12596,7 @@ cl_mem_fence_flags __ovld get_fence(void *ptr); | ||
| 3290 | * where gentype is builtin type or user defined type. | ||
| 3291 | */ | ||
| 3292 | |||
| 3293 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 3294 | +#endif //__opencl_c_generic_address_space | ||
| 3295 | |||
| 3296 | // OpenCL v1.1 s6.11.10, v1.2 s6.12.10, v2.0 s6.13.10 - Async Copies from Global to Local Memory, Local to Global Memory, and Prefetch | ||
| 3297 | |||
| 3298 | @@ -12730,7 +12735,7 @@ event_t __ovld async_work_group_copy(__global uint16 *dst, const __local uint16 | ||
| 3299 | event_t __ovld async_work_group_copy(__global long16 *dst, const __local long16 *src, size_t num_elements, event_t event); | ||
| 3300 | event_t __ovld async_work_group_copy(__global ulong16 *dst, const __local ulong16 *src, size_t num_elements, event_t event); | ||
| 3301 | event_t __ovld async_work_group_copy(__global float16 *dst, const __local float16 *src, size_t num_elements, event_t event); | ||
| 3302 | -#ifdef cl_khr_fp64 | ||
| 3303 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3304 | event_t __ovld async_work_group_copy(__local double *dst, const __global double *src, size_t num_elements, event_t event); | ||
| 3305 | event_t __ovld async_work_group_copy(__local double2 *dst, const __global double2 *src, size_t num_elements, event_t event); | ||
| 3306 | event_t __ovld async_work_group_copy(__local double3 *dst, const __global double3 *src, size_t num_elements, event_t event); | ||
| 3307 | @@ -12743,7 +12748,7 @@ event_t __ovld async_work_group_copy(__global double3 *dst, const __local double | ||
| 3308 | event_t __ovld async_work_group_copy(__global double4 *dst, const __local double4 *src, size_t num_elements, event_t event); | ||
| 3309 | event_t __ovld async_work_group_copy(__global double8 *dst, const __local double8 *src, size_t num_elements, event_t event); | ||
| 3310 | event_t __ovld async_work_group_copy(__global double16 *dst, const __local double16 *src, size_t num_elements, event_t event); | ||
| 3311 | -#endif //cl_khr_fp64 | ||
| 3312 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3313 | #ifdef cl_khr_fp16 | ||
| 3314 | event_t __ovld async_work_group_copy(__local half *dst, const __global half *src, size_t num_elements, event_t event); | ||
| 3315 | event_t __ovld async_work_group_copy(__local half2 *dst, const __global half2 *src, size_t num_elements, event_t event); | ||
| 3316 | @@ -12893,7 +12898,7 @@ event_t __ovld async_work_group_strided_copy(__global uint16 *dst, const __local | ||
| 3317 | event_t __ovld async_work_group_strided_copy(__global long16 *dst, const __local long16 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3318 | event_t __ovld async_work_group_strided_copy(__global ulong16 *dst, const __local ulong16 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3319 | event_t __ovld async_work_group_strided_copy(__global float16 *dst, const __local float16 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3320 | -#ifdef cl_khr_fp64 | ||
| 3321 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3322 | event_t __ovld async_work_group_strided_copy(__local double *dst, const __global double *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3323 | event_t __ovld async_work_group_strided_copy(__local double2 *dst, const __global double2 *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3324 | event_t __ovld async_work_group_strided_copy(__local double3 *dst, const __global double3 *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3325 | @@ -12906,7 +12911,7 @@ event_t __ovld async_work_group_strided_copy(__global double3 *dst, const __loca | ||
| 3326 | event_t __ovld async_work_group_strided_copy(__global double4 *dst, const __local double4 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3327 | event_t __ovld async_work_group_strided_copy(__global double8 *dst, const __local double8 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3328 | event_t __ovld async_work_group_strided_copy(__global double16 *dst, const __local double16 *src, size_t num_elements, size_t dst_stride, event_t event); | ||
| 3329 | -#endif //cl_khr_fp64 | ||
| 3330 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3331 | #ifdef cl_khr_fp16 | ||
| 3332 | event_t __ovld async_work_group_strided_copy(__local half *dst, const __global half *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3333 | event_t __ovld async_work_group_strided_copy(__local half2 *dst, const __global half2 *src, size_t num_elements, size_t src_stride, event_t event); | ||
| 3334 | @@ -12996,14 +13001,14 @@ void __ovld prefetch(const __global uint16 *p, size_t num_elements); | ||
| 3335 | void __ovld prefetch(const __global long16 *p, size_t num_elements); | ||
| 3336 | void __ovld prefetch(const __global ulong16 *p, size_t num_elements); | ||
| 3337 | void __ovld prefetch(const __global float16 *p, size_t num_elements); | ||
| 3338 | -#ifdef cl_khr_fp64 | ||
| 3339 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3340 | void __ovld prefetch(const __global double *p, size_t num_elements); | ||
| 3341 | void __ovld prefetch(const __global double2 *p, size_t num_elements); | ||
| 3342 | void __ovld prefetch(const __global double3 *p, size_t num_elements); | ||
| 3343 | void __ovld prefetch(const __global double4 *p, size_t num_elements); | ||
| 3344 | void __ovld prefetch(const __global double8 *p, size_t num_elements); | ||
| 3345 | void __ovld prefetch(const __global double16 *p, size_t num_elements); | ||
| 3346 | -#endif //cl_khr_fp64 | ||
| 3347 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3348 | #ifdef cl_khr_fp16 | ||
| 3349 | void __ovld prefetch(const __global half *p, size_t num_elements); | ||
| 3350 | void __ovld prefetch(const __global half2 *p, size_t num_elements); | ||
| 3351 | @@ -13026,9 +13031,11 @@ void __ovld prefetch(const __global half16 *p, size_t num_elements); | ||
| 3352 | * pointed by p. The function returns old. | ||
| 3353 | */ | ||
| 3354 | int __ovld atomic_add(volatile __global int *p, int val); | ||
| 3355 | -unsigned int __ovld atomic_add(volatile __global unsigned int *p, unsigned int val); | ||
| 3356 | +unsigned int __ovld atomic_add(volatile __global unsigned int *p, | ||
| 3357 | + unsigned int val); | ||
| 3358 | int __ovld atomic_add(volatile __local int *p, int val); | ||
| 3359 | -unsigned int __ovld atomic_add(volatile __local unsigned int *p, unsigned int val); | ||
| 3360 | +unsigned int __ovld atomic_add(volatile __local unsigned int *p, | ||
| 3361 | + unsigned int val); | ||
| 3362 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3363 | int __ovld atomic_add(volatile int *p, int val); | ||
| 3364 | unsigned int __ovld atomic_add(volatile unsigned int *p, unsigned int val); | ||
| 3365 | @@ -13056,9 +13063,11 @@ unsigned long __ovld atom_add(volatile __local unsigned long *p, unsigned long v | ||
| 3366 | * returns old. | ||
| 3367 | */ | ||
| 3368 | int __ovld atomic_sub(volatile __global int *p, int val); | ||
| 3369 | -unsigned int __ovld atomic_sub(volatile __global unsigned int *p, unsigned int val); | ||
| 3370 | +unsigned int __ovld atomic_sub(volatile __global unsigned int *p, | ||
| 3371 | + unsigned int val); | ||
| 3372 | int __ovld atomic_sub(volatile __local int *p, int val); | ||
| 3373 | -unsigned int __ovld atomic_sub(volatile __local unsigned int *p, unsigned int val); | ||
| 3374 | +unsigned int __ovld atomic_sub(volatile __local unsigned int *p, | ||
| 3375 | + unsigned int val); | ||
| 3376 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3377 | int __ovld atomic_sub(volatile int *p, int val); | ||
| 3378 | unsigned int __ovld atomic_sub(volatile unsigned int *p, unsigned int val); | ||
| 3379 | @@ -13086,9 +13095,11 @@ unsigned long __ovld atom_sub(volatile __local unsigned long *p, unsigned long v | ||
| 3380 | * value. | ||
| 3381 | */ | ||
| 3382 | int __ovld atomic_xchg(volatile __global int *p, int val); | ||
| 3383 | -unsigned int __ovld atomic_xchg(volatile __global unsigned int *p, unsigned int val); | ||
| 3384 | +unsigned int __ovld atomic_xchg(volatile __global unsigned int *p, | ||
| 3385 | + unsigned int val); | ||
| 3386 | int __ovld atomic_xchg(volatile __local int *p, int val); | ||
| 3387 | -unsigned int __ovld atomic_xchg(volatile __local unsigned int *p, unsigned int val); | ||
| 3388 | +unsigned int __ovld atomic_xchg(volatile __local unsigned int *p, | ||
| 3389 | + unsigned int val); | ||
| 3390 | float __ovld atomic_xchg(volatile __global float *p, float val); | ||
| 3391 | float __ovld atomic_xchg(volatile __local float *p, float val); | ||
| 3392 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3393 | @@ -13183,12 +13194,15 @@ unsigned long __ovld atom_dec(volatile __local unsigned long *p); | ||
| 3394 | * returns old. | ||
| 3395 | */ | ||
| 3396 | int __ovld atomic_cmpxchg(volatile __global int *p, int cmp, int val); | ||
| 3397 | -unsigned int __ovld atomic_cmpxchg(volatile __global unsigned int *p, unsigned int cmp, unsigned int val); | ||
| 3398 | +unsigned int __ovld atomic_cmpxchg(volatile __global unsigned int *p, | ||
| 3399 | + unsigned int cmp, unsigned int val); | ||
| 3400 | int __ovld atomic_cmpxchg(volatile __local int *p, int cmp, int val); | ||
| 3401 | -unsigned int __ovld atomic_cmpxchg(volatile __local unsigned int *p, unsigned int cmp, unsigned int val); | ||
| 3402 | +unsigned int __ovld atomic_cmpxchg(volatile __local unsigned int *p, | ||
| 3403 | + unsigned int cmp, unsigned int val); | ||
| 3404 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3405 | int __ovld atomic_cmpxchg(volatile int *p, int cmp, int val); | ||
| 3406 | -unsigned int __ovld atomic_cmpxchg(volatile unsigned int *p, unsigned int cmp, unsigned int val); | ||
| 3407 | +unsigned int __ovld atomic_cmpxchg(volatile unsigned int *p, unsigned int cmp, | ||
| 3408 | + unsigned int val); | ||
| 3409 | #endif | ||
| 3410 | |||
| 3411 | #if defined(cl_khr_global_int32_base_atomics) | ||
| 3412 | @@ -13215,9 +13229,11 @@ unsigned long __ovld atom_cmpxchg(volatile __local unsigned long *p, unsigned lo | ||
| 3413 | * returns old. | ||
| 3414 | */ | ||
| 3415 | int __ovld atomic_min(volatile __global int *p, int val); | ||
| 3416 | -unsigned int __ovld atomic_min(volatile __global unsigned int *p, unsigned int val); | ||
| 3417 | +unsigned int __ovld atomic_min(volatile __global unsigned int *p, | ||
| 3418 | + unsigned int val); | ||
| 3419 | int __ovld atomic_min(volatile __local int *p, int val); | ||
| 3420 | -unsigned int __ovld atomic_min(volatile __local unsigned int *p, unsigned int val); | ||
| 3421 | +unsigned int __ovld atomic_min(volatile __local unsigned int *p, | ||
| 3422 | + unsigned int val); | ||
| 3423 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3424 | int __ovld atomic_min(volatile int *p, int val); | ||
| 3425 | unsigned int __ovld atomic_min(volatile unsigned int *p, unsigned int val); | ||
| 3426 | @@ -13247,9 +13263,11 @@ unsigned long __ovld atom_min(volatile __local unsigned long *p, unsigned long v | ||
| 3427 | * returns old. | ||
| 3428 | */ | ||
| 3429 | int __ovld atomic_max(volatile __global int *p, int val); | ||
| 3430 | -unsigned int __ovld atomic_max(volatile __global unsigned int *p, unsigned int val); | ||
| 3431 | +unsigned int __ovld atomic_max(volatile __global unsigned int *p, | ||
| 3432 | + unsigned int val); | ||
| 3433 | int __ovld atomic_max(volatile __local int *p, int val); | ||
| 3434 | -unsigned int __ovld atomic_max(volatile __local unsigned int *p, unsigned int val); | ||
| 3435 | +unsigned int __ovld atomic_max(volatile __local unsigned int *p, | ||
| 3436 | + unsigned int val); | ||
| 3437 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3438 | int __ovld atomic_max(volatile int *p, int val); | ||
| 3439 | unsigned int __ovld atomic_max(volatile unsigned int *p, unsigned int val); | ||
| 3440 | @@ -13278,9 +13296,11 @@ unsigned long __ovld atom_max(volatile __local unsigned long *p, unsigned long v | ||
| 3441 | * pointed by p. The function returns old. | ||
| 3442 | */ | ||
| 3443 | int __ovld atomic_and(volatile __global int *p, int val); | ||
| 3444 | -unsigned int __ovld atomic_and(volatile __global unsigned int *p, unsigned int val); | ||
| 3445 | +unsigned int __ovld atomic_and(volatile __global unsigned int *p, | ||
| 3446 | + unsigned int val); | ||
| 3447 | int __ovld atomic_and(volatile __local int *p, int val); | ||
| 3448 | -unsigned int __ovld atomic_and(volatile __local unsigned int *p, unsigned int val); | ||
| 3449 | +unsigned int __ovld atomic_and(volatile __local unsigned int *p, | ||
| 3450 | + unsigned int val); | ||
| 3451 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3452 | int __ovld atomic_and(volatile int *p, int val); | ||
| 3453 | unsigned int __ovld atomic_and(volatile unsigned int *p, unsigned int val); | ||
| 3454 | @@ -13309,9 +13329,11 @@ unsigned long __ovld atom_and(volatile __local unsigned long *p, unsigned long v | ||
| 3455 | * pointed by p. The function returns old. | ||
| 3456 | */ | ||
| 3457 | int __ovld atomic_or(volatile __global int *p, int val); | ||
| 3458 | -unsigned int __ovld atomic_or(volatile __global unsigned int *p, unsigned int val); | ||
| 3459 | +unsigned int __ovld atomic_or(volatile __global unsigned int *p, | ||
| 3460 | + unsigned int val); | ||
| 3461 | int __ovld atomic_or(volatile __local int *p, int val); | ||
| 3462 | -unsigned int __ovld atomic_or(volatile __local unsigned int *p, unsigned int val); | ||
| 3463 | +unsigned int __ovld atomic_or(volatile __local unsigned int *p, | ||
| 3464 | + unsigned int val); | ||
| 3465 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3466 | int __ovld atomic_or(volatile int *p, int val); | ||
| 3467 | unsigned int __ovld atomic_or(volatile unsigned int *p, unsigned int val); | ||
| 3468 | @@ -13340,9 +13362,11 @@ unsigned long __ovld atom_or(volatile __local unsigned long *p, unsigned long va | ||
| 3469 | * pointed by p. The function returns old. | ||
| 3470 | */ | ||
| 3471 | int __ovld atomic_xor(volatile __global int *p, int val); | ||
| 3472 | -unsigned int __ovld atomic_xor(volatile __global unsigned int *p, unsigned int val); | ||
| 3473 | +unsigned int __ovld atomic_xor(volatile __global unsigned int *p, | ||
| 3474 | + unsigned int val); | ||
| 3475 | int __ovld atomic_xor(volatile __local int *p, int val); | ||
| 3476 | -unsigned int __ovld atomic_xor(volatile __local unsigned int *p, unsigned int val); | ||
| 3477 | +unsigned int __ovld atomic_xor(volatile __local unsigned int *p, | ||
| 3478 | + unsigned int val); | ||
| 3479 | #ifdef __OPENCL_CPP_VERSION__ | ||
| 3480 | int __ovld atomic_xor(volatile int *p, int val); | ||
| 3481 | unsigned int __ovld atomic_xor(volatile unsigned int *p, unsigned int val); | ||
| 3482 | @@ -13380,108 +13404,78 @@ unsigned long __ovld atom_xor(volatile __local unsigned long *p, unsigned long v | ||
| 3483 | #endif | ||
| 3484 | |||
| 3485 | // atomic_init() | ||
| 3486 | +#ifdef __opencl_c_generic_address_space | ||
| 3487 | void __ovld atomic_init(volatile atomic_int *object, int value); | ||
| 3488 | void __ovld atomic_init(volatile atomic_uint *object, uint value); | ||
| 3489 | void __ovld atomic_init(volatile atomic_float *object, float value); | ||
| 3490 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3491 | void __ovld atomic_init(volatile atomic_long *object, long value); | ||
| 3492 | void __ovld atomic_init(volatile atomic_ulong *object, ulong value); | ||
| 3493 | -#ifdef cl_khr_fp64 | ||
| 3494 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3495 | void __ovld atomic_init(volatile atomic_double *object, double value); | ||
| 3496 | -#endif //cl_khr_fp64 | ||
| 3497 | -#endif | ||
| 3498 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3499 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3500 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3501 | +#endif // __opencl_c_generic_address_space | ||
| 3502 | + | ||
| 3503 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 3504 | +void __ovld atomic_init(volatile atomic_int __global *object, int value); | ||
| 3505 | +void __ovld atomic_init(volatile atomic_int __local *object, int value); | ||
| 3506 | +void __ovld atomic_init(volatile atomic_uint __global *object, uint value); | ||
| 3507 | +void __ovld atomic_init(volatile atomic_uint __local *object, uint value); | ||
| 3508 | +void __ovld atomic_init(volatile atomic_float __global *object, float value); | ||
| 3509 | +void __ovld atomic_init(volatile atomic_float __local *object, float value); | ||
| 3510 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3511 | +void __ovld atomic_init(volatile atomic_long __global *object, long value); | ||
| 3512 | +void __ovld atomic_init(volatile atomic_long __local *object, long value); | ||
| 3513 | +void __ovld atomic_init(volatile atomic_ulong __global *object, ulong value); | ||
| 3514 | +void __ovld atomic_init(volatile atomic_ulong __local *object, ulong value); | ||
| 3515 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 3516 | +void __ovld atomic_init(volatile atomic_double __global *object, double value); | ||
| 3517 | +void __ovld atomic_init(volatile atomic_double __local *object, double value); | ||
| 3518 | +#endif // cl_khr_fp64 | ||
| 3519 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3520 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3521 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 3522 | |||
| 3523 | // atomic_work_item_fence() | ||
| 3524 | -void __ovld atomic_work_item_fence(cl_mem_fence_flags flags, memory_order order, memory_scope scope); | ||
| 3525 | +void __ovld atomic_work_item_fence(cl_mem_fence_flags flags, memory_order order, | ||
| 3526 | + memory_scope scope); | ||
| 3527 | |||
| 3528 | // atomic_fetch() | ||
| 3529 | - | ||
| 3530 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 3531 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 3532 | +#ifdef __opencl_c_generic_address_space | ||
| 3533 | int __ovld atomic_fetch_add(volatile atomic_int *object, int operand); | ||
| 3534 | -int __ovld atomic_fetch_add_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3535 | -int __ovld atomic_fetch_add_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3536 | uint __ovld atomic_fetch_add(volatile atomic_uint *object, uint operand); | ||
| 3537 | -uint __ovld atomic_fetch_add_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3538 | -uint __ovld atomic_fetch_add_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3539 | int __ovld atomic_fetch_sub(volatile atomic_int *object, int operand); | ||
| 3540 | -int __ovld atomic_fetch_sub_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3541 | -int __ovld atomic_fetch_sub_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3542 | uint __ovld atomic_fetch_sub(volatile atomic_uint *object, uint operand); | ||
| 3543 | -uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3544 | -uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3545 | int __ovld atomic_fetch_or(volatile atomic_int *object, int operand); | ||
| 3546 | -int __ovld atomic_fetch_or_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3547 | -int __ovld atomic_fetch_or_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3548 | uint __ovld atomic_fetch_or(volatile atomic_uint *object, uint operand); | ||
| 3549 | -uint __ovld atomic_fetch_or_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3550 | -uint __ovld atomic_fetch_or_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3551 | int __ovld atomic_fetch_xor(volatile atomic_int *object, int operand); | ||
| 3552 | -int __ovld atomic_fetch_xor_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3553 | -int __ovld atomic_fetch_xor_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3554 | uint __ovld atomic_fetch_xor(volatile atomic_uint *object, uint operand); | ||
| 3555 | -uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3556 | -uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3557 | int __ovld atomic_fetch_and(volatile atomic_int *object, int operand); | ||
| 3558 | -int __ovld atomic_fetch_and_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3559 | -int __ovld atomic_fetch_and_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3560 | uint __ovld atomic_fetch_and(volatile atomic_uint *object, uint operand); | ||
| 3561 | -uint __ovld atomic_fetch_and_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3562 | -uint __ovld atomic_fetch_and_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3563 | int __ovld atomic_fetch_min(volatile atomic_int *object, int operand); | ||
| 3564 | -int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3565 | -int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3566 | uint __ovld atomic_fetch_min(volatile atomic_uint *object, uint operand); | ||
| 3567 | -uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3568 | -uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3569 | int __ovld atomic_fetch_max(volatile atomic_int *object, int operand); | ||
| 3570 | -int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, memory_order order); | ||
| 3571 | -int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, memory_order order, memory_scope scope); | ||
| 3572 | uint __ovld atomic_fetch_max(volatile atomic_uint *object, uint operand); | ||
| 3573 | -uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, uint operand, memory_order order); | ||
| 3574 | -uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, uint operand, memory_order order, memory_scope scope); | ||
| 3575 | |||
| 3576 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3577 | long __ovld atomic_fetch_add(volatile atomic_long *object, long operand); | ||
| 3578 | -long __ovld atomic_fetch_add_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3579 | -long __ovld atomic_fetch_add_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3580 | ulong __ovld atomic_fetch_add(volatile atomic_ulong *object, ulong operand); | ||
| 3581 | -ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3582 | -ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3583 | long __ovld atomic_fetch_sub(volatile atomic_long *object, long operand); | ||
| 3584 | -long __ovld atomic_fetch_sub_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3585 | -long __ovld atomic_fetch_sub_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3586 | ulong __ovld atomic_fetch_sub(volatile atomic_ulong *object, ulong operand); | ||
| 3587 | -ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3588 | -ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3589 | long __ovld atomic_fetch_or(volatile atomic_long *object, long operand); | ||
| 3590 | -long __ovld atomic_fetch_or_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3591 | -long __ovld atomic_fetch_or_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3592 | ulong __ovld atomic_fetch_or(volatile atomic_ulong *object, ulong operand); | ||
| 3593 | -ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3594 | -ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3595 | long __ovld atomic_fetch_xor(volatile atomic_long *object, long operand); | ||
| 3596 | -long __ovld atomic_fetch_xor_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3597 | -long __ovld atomic_fetch_xor_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3598 | ulong __ovld atomic_fetch_xor(volatile atomic_ulong *object, ulong operand); | ||
| 3599 | -ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3600 | -ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3601 | long __ovld atomic_fetch_and(volatile atomic_long *object, long operand); | ||
| 3602 | -long __ovld atomic_fetch_and_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3603 | -long __ovld atomic_fetch_and_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3604 | ulong __ovld atomic_fetch_and(volatile atomic_ulong *object, ulong operand); | ||
| 3605 | -ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3606 | -ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3607 | long __ovld atomic_fetch_min(volatile atomic_long *object, long operand); | ||
| 3608 | -long __ovld atomic_fetch_min_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3609 | -long __ovld atomic_fetch_min_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3610 | ulong __ovld atomic_fetch_min(volatile atomic_ulong *object, ulong operand); | ||
| 3611 | -ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3612 | -ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3613 | long __ovld atomic_fetch_max(volatile atomic_long *object, long operand); | ||
| 3614 | -long __ovld atomic_fetch_max_explicit(volatile atomic_long *object, long operand, memory_order order); | ||
| 3615 | -long __ovld atomic_fetch_max_explicit(volatile atomic_long *object, long operand, memory_order order, memory_scope scope); | ||
| 3616 | ulong __ovld atomic_fetch_max(volatile atomic_ulong *object, ulong operand); | ||
| 3617 | -ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, ulong operand, memory_order order); | ||
| 3618 | -ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, ulong operand, memory_order order, memory_scope scope); | ||
| 3619 | #endif //defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3620 | |||
| 3621 | // OpenCL v2.0 s6.13.11.7.5: | ||
| 3622 | @@ -13489,196 +13483,2239 @@ ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, ulong oper | ||
| 3623 | // or/xor/and/min/max: atomic type argument can be intptr_t/uintptr_t, value type argument can be intptr_t/uintptr_t. | ||
| 3624 | |||
| 3625 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3626 | -uintptr_t __ovld atomic_fetch_add(volatile atomic_uintptr_t *object, ptrdiff_t operand); | ||
| 3627 | -uintptr_t __ovld atomic_fetch_add_explicit(volatile atomic_uintptr_t *object, ptrdiff_t operand, memory_order order); | ||
| 3628 | -uintptr_t __ovld atomic_fetch_add_explicit(volatile atomic_uintptr_t *object, ptrdiff_t operand, memory_order order, memory_scope scope); | ||
| 3629 | -uintptr_t __ovld atomic_fetch_sub(volatile atomic_uintptr_t *object, ptrdiff_t operand); | ||
| 3630 | -uintptr_t __ovld atomic_fetch_sub_explicit(volatile atomic_uintptr_t *object, ptrdiff_t operand, memory_order order); | ||
| 3631 | -uintptr_t __ovld atomic_fetch_sub_explicit(volatile atomic_uintptr_t *object, ptrdiff_t operand, memory_order order, memory_scope scope); | ||
| 3632 | - | ||
| 3633 | -uintptr_t __ovld atomic_fetch_or(volatile atomic_uintptr_t *object, intptr_t operand); | ||
| 3634 | -uintptr_t __ovld atomic_fetch_or_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order); | ||
| 3635 | -uintptr_t __ovld atomic_fetch_or_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order, memory_scope scope); | ||
| 3636 | -uintptr_t __ovld atomic_fetch_xor(volatile atomic_uintptr_t *object, intptr_t operand); | ||
| 3637 | -uintptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order); | ||
| 3638 | -uintptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order, memory_scope scope); | ||
| 3639 | -uintptr_t __ovld atomic_fetch_and(volatile atomic_uintptr_t *object, intptr_t operand); | ||
| 3640 | -uintptr_t __ovld atomic_fetch_and_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order); | ||
| 3641 | -uintptr_t __ovld atomic_fetch_and_explicit(volatile atomic_uintptr_t *object, intptr_t operand, memory_order order, memory_scope scope); | ||
| 3642 | -uintptr_t __ovld atomic_fetch_min(volatile atomic_uintptr_t *object, intptr_t opermax); | ||
| 3643 | -uintptr_t __ovld atomic_fetch_min_explicit(volatile atomic_uintptr_t *object, intptr_t opermax, memory_order minder); | ||
| 3644 | -uintptr_t __ovld atomic_fetch_min_explicit(volatile atomic_uintptr_t *object, intptr_t opermax, memory_order minder, memory_scope scope); | ||
| 3645 | -uintptr_t __ovld atomic_fetch_max(volatile atomic_uintptr_t *object, intptr_t opermax); | ||
| 3646 | -uintptr_t __ovld atomic_fetch_max_explicit(volatile atomic_uintptr_t *object, intptr_t opermax, memory_order minder); | ||
| 3647 | -uintptr_t __ovld atomic_fetch_max_explicit(volatile atomic_uintptr_t *object, intptr_t opermax, memory_order minder, memory_scope scope); | ||
| 3648 | - | ||
| 3649 | -intptr_t __ovld atomic_fetch_or(volatile atomic_intptr_t *object, uintptr_t operand); | ||
| 3650 | -intptr_t __ovld atomic_fetch_or_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order); | ||
| 3651 | -intptr_t __ovld atomic_fetch_or_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order, memory_scope scope); | ||
| 3652 | -intptr_t __ovld atomic_fetch_xor(volatile atomic_intptr_t *object, uintptr_t operand); | ||
| 3653 | -intptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order); | ||
| 3654 | -intptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order, memory_scope scope); | ||
| 3655 | -intptr_t __ovld atomic_fetch_and(volatile atomic_intptr_t *object, uintptr_t operand); | ||
| 3656 | -intptr_t __ovld atomic_fetch_and_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order); | ||
| 3657 | -intptr_t __ovld atomic_fetch_and_explicit(volatile atomic_intptr_t *object, uintptr_t operand, memory_order order, memory_scope scope); | ||
| 3658 | -intptr_t __ovld atomic_fetch_min(volatile atomic_intptr_t *object, uintptr_t opermax); | ||
| 3659 | -intptr_t __ovld atomic_fetch_min_explicit(volatile atomic_intptr_t *object, uintptr_t opermax, memory_order minder); | ||
| 3660 | -intptr_t __ovld atomic_fetch_min_explicit(volatile atomic_intptr_t *object, uintptr_t opermax, memory_order minder, memory_scope scope); | ||
| 3661 | -intptr_t __ovld atomic_fetch_max(volatile atomic_intptr_t *object, uintptr_t opermax); | ||
| 3662 | -intptr_t __ovld atomic_fetch_max_explicit(volatile atomic_intptr_t *object, uintptr_t opermax, memory_order minder); | ||
| 3663 | -intptr_t __ovld atomic_fetch_max_explicit(volatile atomic_intptr_t *object, uintptr_t opermax, memory_order minder, memory_scope scope); | ||
| 3664 | +uintptr_t __ovld atomic_fetch_add(volatile atomic_uintptr_t *object, | ||
| 3665 | + ptrdiff_t operand); | ||
| 3666 | +uintptr_t __ovld atomic_fetch_sub(volatile atomic_uintptr_t *object, | ||
| 3667 | + ptrdiff_t operand); | ||
| 3668 | + | ||
| 3669 | +uintptr_t __ovld atomic_fetch_or(volatile atomic_uintptr_t *object, | ||
| 3670 | + intptr_t operand); | ||
| 3671 | +uintptr_t __ovld atomic_fetch_xor(volatile atomic_uintptr_t *object, | ||
| 3672 | + intptr_t operand); | ||
| 3673 | +uintptr_t __ovld atomic_fetch_and(volatile atomic_uintptr_t *object, | ||
| 3674 | + intptr_t operand); | ||
| 3675 | +uintptr_t __ovld atomic_fetch_min(volatile atomic_uintptr_t *object, | ||
| 3676 | + intptr_t opermax); | ||
| 3677 | +uintptr_t __ovld atomic_fetch_max(volatile atomic_uintptr_t *object, | ||
| 3678 | + intptr_t opermax); | ||
| 3679 | + | ||
| 3680 | +intptr_t __ovld atomic_fetch_or(volatile atomic_intptr_t *object, | ||
| 3681 | + uintptr_t operand); | ||
| 3682 | +intptr_t __ovld atomic_fetch_xor(volatile atomic_intptr_t *object, | ||
| 3683 | + uintptr_t operand); | ||
| 3684 | +intptr_t __ovld atomic_fetch_and(volatile atomic_intptr_t *object, | ||
| 3685 | + uintptr_t operand); | ||
| 3686 | +intptr_t __ovld atomic_fetch_min(volatile atomic_intptr_t *object, | ||
| 3687 | + uintptr_t opermax); | ||
| 3688 | +intptr_t __ovld atomic_fetch_max(volatile atomic_intptr_t *object, | ||
| 3689 | + uintptr_t opermax); | ||
| 3690 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3691 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3692 | +#endif // __opencl_c_generic_address_space | ||
| 3693 | + | ||
| 3694 | +#if(__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 3695 | +int __ovld atomic_fetch_add(volatile atomic_int __global *object, int operand); | ||
| 3696 | +uint __ovld atomic_fetch_add(volatile atomic_uint __local *object, | ||
| 3697 | + uint operand); | ||
| 3698 | +int __ovld atomic_fetch_sub(volatile atomic_int __global *object, int operand); | ||
| 3699 | +int __ovld atomic_fetch_sub(volatile atomic_int __local *object, int operand); | ||
| 3700 | +uint __ovld atomic_fetch_sub(volatile atomic_uint __local *object, | ||
| 3701 | + uint operand); | ||
| 3702 | +uint __ovld atomic_fetch_sub(volatile atomic_uint __global *object, | ||
| 3703 | + uint operand); | ||
| 3704 | +int __ovld atomic_fetch_or(volatile atomic_int __global *object, int operand); | ||
| 3705 | +uint __ovld atomic_fetch_sub(volatile atomic_uint __local *object, | ||
| 3706 | + uint operand); | ||
| 3707 | +uint __ovld atomic_fetch_or(volatile atomic_uint __global *object, | ||
| 3708 | + uint operand); | ||
| 3709 | +uint __ovld atomic_fetch_or(volatile atomic_uint __local *object, uint operand); | ||
| 3710 | +int __ovld atomic_fetch_xor(volatile atomic_int __global *object, int operand); | ||
| 3711 | +int __ovld atomic_fetch_xor(volatile atomic_int __local *object, int operand); | ||
| 3712 | +uint __ovld atomic_fetch_xor(volatile atomic_uint __global *object, | ||
| 3713 | + uint operand); | ||
| 3714 | +uint __ovld atomic_fetch_xor(volatile atomic_uint __local *object, | ||
| 3715 | + uint operand); | ||
| 3716 | +int __ovld atomic_fetch_and(volatile atomic_int __global *object, int operand); | ||
| 3717 | +int __ovld atomic_fetch_and(volatile atomic_int __local *object, int operand); | ||
| 3718 | +uint __ovld atomic_fetch_and(volatile atomic_uint __global *object, | ||
| 3719 | + uint operand); | ||
| 3720 | +uint __ovld atomic_fetch_and(volatile atomic_uint __local *object, | ||
| 3721 | + uint operand); | ||
| 3722 | +int __ovld atomic_fetch_min(volatile atomic_int __global *object, int operand); | ||
| 3723 | +int __ovld atomic_fetch_min(volatile atomic_int __local *object, int operand); | ||
| 3724 | +uint __ovld atomic_fetch_min(volatile atomic_uint __global *object, | ||
| 3725 | + uint operand); | ||
| 3726 | +uint __ovld atomic_fetch_min(volatile atomic_uint __local *object, | ||
| 3727 | + uint operand); | ||
| 3728 | +int __ovld atomic_fetch_max(volatile atomic_int __global *object, int operand); | ||
| 3729 | +int __ovld atomic_fetch_max(volatile atomic_int __local *object, int operand); | ||
| 3730 | +uint __ovld atomic_fetch_max(volatile atomic_uint __global *object, | ||
| 3731 | + uint operand); | ||
| 3732 | +uint __ovld atomic_fetch_max(volatile atomic_uint __local *object, | ||
| 3733 | + uint operand); | ||
| 3734 | + | ||
| 3735 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3736 | +long __ovld atomic_fetch_add(volatile atomic_long __global *object, | ||
| 3737 | + long operand); | ||
| 3738 | +long __ovld atomic_fetch_add(volatile atomic_long __local *object, | ||
| 3739 | + long operand); | ||
| 3740 | +ulong __ovld atomic_fetch_add(volatile atomic_ulong __global *object, | ||
| 3741 | + ulong operand); | ||
| 3742 | +ulong __ovld atomic_fetch_add(volatile atomic_ulong __local *object, | ||
| 3743 | + ulong operand); | ||
| 3744 | +long __ovld atomic_fetch_sub(volatile atomic_long __global *object, | ||
| 3745 | + long operand); | ||
| 3746 | +long __ovld atomic_fetch_sub(volatile atomic_long __local *object, | ||
| 3747 | + long operand); | ||
| 3748 | +ulong __ovld atomic_fetch_sub(volatile atomic_ulong __global *object, | ||
| 3749 | + ulong operand); | ||
| 3750 | +ulong __ovld atomic_fetch_sub(volatile atomic_ulong __local *object, | ||
| 3751 | + ulong operand); | ||
| 3752 | +long __ovld atomic_fetch_or(volatile atomic_long __global *object, | ||
| 3753 | + long operand); | ||
| 3754 | +long __ovld atomic_fetch_or(volatile atomic_long __local *object, long operand); | ||
| 3755 | +ulong __ovld atomic_fetch_or(volatile atomic_ulong __global *object, | ||
| 3756 | + ulong operand); | ||
| 3757 | +ulong __ovld atomic_fetch_or(volatile atomic_ulong __local *object, | ||
| 3758 | + ulong operand); | ||
| 3759 | +long __ovld atomic_fetch_xor(volatile atomic_long __global *object, | ||
| 3760 | + long operand); | ||
| 3761 | +long __ovld atomic_fetch_xor(volatile atomic_long __local *object, | ||
| 3762 | + long operand); | ||
| 3763 | +ulong __ovld atomic_fetch_xor(volatile atomic_ulong __global *object, | ||
| 3764 | + ulong operand); | ||
| 3765 | +ulong __ovld atomic_fetch_xor(volatile atomic_ulong __local *object, | ||
| 3766 | + ulong operand); | ||
| 3767 | +long __ovld atomic_fetch_and(volatile atomic_long __global *object, | ||
| 3768 | + long operand); | ||
| 3769 | +long __ovld atomic_fetch_and(volatile atomic_long __local *object, | ||
| 3770 | + long operand); | ||
| 3771 | +ulong __ovld atomic_fetch_and(volatile atomic_ulong __global *object, | ||
| 3772 | + ulong operand); | ||
| 3773 | +ulong __ovld atomic_fetch_and(volatile atomic_ulong __local *object, | ||
| 3774 | + ulong operand); | ||
| 3775 | +long __ovld atomic_fetch_min(volatile atomic_long __global *object, | ||
| 3776 | + long operand); | ||
| 3777 | +long __ovld atomic_fetch_min(volatile atomic_long __local *object, | ||
| 3778 | + long operand); | ||
| 3779 | +ulong __ovld atomic_fetch_min(volatile atomic_ulong __global *object, | ||
| 3780 | + ulong operand); | ||
| 3781 | +ulong __ovld atomic_fetch_min(volatile atomic_ulong __local *object, | ||
| 3782 | + ulong operand); | ||
| 3783 | +long __ovld atomic_fetch_max(volatile atomic_long __global *object, | ||
| 3784 | + long operand); | ||
| 3785 | +long __ovld atomic_fetch_max(volatile atomic_long __local *object, | ||
| 3786 | + long operand); | ||
| 3787 | +ulong __ovld atomic_fetch_max(volatile atomic_ulong __global *object, | ||
| 3788 | + ulong operand); | ||
| 3789 | +ulong __ovld atomic_fetch_max(volatile atomic_ulong __local *object, | ||
| 3790 | + ulong operand); | ||
| 3791 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3792 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3793 | + | ||
| 3794 | +// OpenCL v2.0 s6.13.11.7.5: | ||
| 3795 | +// add/sub: atomic type argument can be uintptr_t/intptr_t, value type argument | ||
| 3796 | +// can be ptrdiff_t. or/xor/and/min/max: atomic type argument can be | ||
| 3797 | +// intptr_t/uintptr_t, value type argument can be intptr_t/uintptr_t. | ||
| 3798 | + | ||
| 3799 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3800 | +uintptr_t __ovld atomic_fetch_add(volatile atomic_uintptr_t __global *object, | ||
| 3801 | + ptrdiff_t operand); | ||
| 3802 | +uintptr_t __ovld atomic_fetch_add(volatile atomic_uintptr_t __local *object, | ||
| 3803 | + ptrdiff_t operand); | ||
| 3804 | +uintptr_t __ovld atomic_fetch_sub(volatile atomic_uintptr_t __global *object, | ||
| 3805 | + ptrdiff_t operand); | ||
| 3806 | +uintptr_t __ovld atomic_fetch_sub(volatile atomic_uintptr_t __local *object, | ||
| 3807 | + ptrdiff_t operand); | ||
| 3808 | + | ||
| 3809 | +uintptr_t __ovld atomic_fetch_or(volatile atomic_uintptr_t __global *object, | ||
| 3810 | + intptr_t operand); | ||
| 3811 | +uintptr_t __ovld atomic_fetch_or(volatile atomic_uintptr_t __local *object, | ||
| 3812 | + intptr_t operand); | ||
| 3813 | +uintptr_t __ovld atomic_fetch_xor(volatile atomic_uintptr_t __global *object, | ||
| 3814 | + intptr_t operand); | ||
| 3815 | +uintptr_t __ovld atomic_fetch_xor(volatile atomic_uintptr_t __local *object, | ||
| 3816 | + intptr_t operand); | ||
| 3817 | +uintptr_t __ovld atomic_fetch_and(volatile atomic_uintptr_t __global *object, | ||
| 3818 | + intptr_t operand); | ||
| 3819 | +uintptr_t __ovld atomic_fetch_and(volatile atomic_uintptr_t __local *object, | ||
| 3820 | + intptr_t operand); | ||
| 3821 | +uintptr_t __ovld atomic_fetch_min(volatile atomic_uintptr_t __global *object, | ||
| 3822 | + intptr_t opermax); | ||
| 3823 | +uintptr_t __ovld atomic_fetch_min(volatile atomic_uintptr_t __local *object, | ||
| 3824 | + intptr_t opermax); | ||
| 3825 | +uintptr_t __ovld atomic_fetch_max(volatile atomic_uintptr_t __global *object, | ||
| 3826 | + intptr_t opermax); | ||
| 3827 | +uintptr_t __ovld atomic_fetch_max(volatile atomic_uintptr_t __local *object, | ||
| 3828 | + intptr_t opermax); | ||
| 3829 | + | ||
| 3830 | +intptr_t __ovld atomic_fetch_or(volatile atomic_intptr_t __global *object, | ||
| 3831 | + uintptr_t operand); | ||
| 3832 | +intptr_t __ovld atomic_fetch_or(volatile atomic_intptr_t __local *object, | ||
| 3833 | + uintptr_t operand); | ||
| 3834 | +intptr_t __ovld atomic_fetch_xor(volatile atomic_intptr_t __global *object, | ||
| 3835 | + uintptr_t operand); | ||
| 3836 | +intptr_t __ovld atomic_fetch_xor(volatile atomic_intptr_t __local *object, | ||
| 3837 | + uintptr_t operand); | ||
| 3838 | +intptr_t __ovld atomic_fetch_and(volatile atomic_intptr_t __global *object, | ||
| 3839 | + uintptr_t operand); | ||
| 3840 | +intptr_t __ovld atomic_fetch_and(volatile atomic_intptr_t __local *object, | ||
| 3841 | + uintptr_t operand); | ||
| 3842 | +intptr_t __ovld atomic_fetch_min(volatile atomic_intptr_t __global *object, | ||
| 3843 | + uintptr_t opermax); | ||
| 3844 | +intptr_t __ovld atomic_fetch_min(volatile atomic_intptr_t __local *object, | ||
| 3845 | + uintptr_t opermax); | ||
| 3846 | +intptr_t __ovld atomic_fetch_max(volatile atomic_intptr_t __global *object, | ||
| 3847 | + uintptr_t opermax); | ||
| 3848 | +intptr_t __ovld atomic_fetch_max(volatile atomic_intptr_t __local *object, | ||
| 3849 | + uintptr_t opermax); | ||
| 3850 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3851 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3852 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 3853 | + | ||
| 3854 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 3855 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 3856 | + | ||
| 3857 | +#ifdef __opencl_c_generic_address_space | ||
| 3858 | +#ifdef __opencl_c_atomic_scope_device | ||
| 3859 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int *object, int operand, | ||
| 3860 | + memory_order order); | ||
| 3861 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint *object, | ||
| 3862 | + uint operand, memory_order order); | ||
| 3863 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int *object, int operand, | ||
| 3864 | + memory_order order); | ||
| 3865 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint *object, | ||
| 3866 | + uint operand, memory_order order); | ||
| 3867 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int *object, int operand, | ||
| 3868 | + memory_order order); | ||
| 3869 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint *object, uint operand, | ||
| 3870 | + memory_order order); | ||
| 3871 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int *object, int operand, | ||
| 3872 | + memory_order order); | ||
| 3873 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint *object, | ||
| 3874 | + uint operand, memory_order order); | ||
| 3875 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int *object, int operand, | ||
| 3876 | + memory_order order); | ||
| 3877 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint *object, | ||
| 3878 | + uint operand, memory_order order); | ||
| 3879 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, | ||
| 3880 | + memory_order order); | ||
| 3881 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, | ||
| 3882 | + uint operand, memory_order order); | ||
| 3883 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, | ||
| 3884 | + memory_order order); | ||
| 3885 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, | ||
| 3886 | + uint operand, memory_order order); | ||
| 3887 | +#endif // __opencl_c_atomic_scope_device | ||
| 3888 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int *object, int operand, | ||
| 3889 | + memory_order order, memory_scope scope); | ||
| 3890 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint *object, | ||
| 3891 | + uint operand, memory_order order, | ||
| 3892 | + memory_scope scope); | ||
| 3893 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int *object, int operand, | ||
| 3894 | + memory_order order, memory_scope scope); | ||
| 3895 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint *object, | ||
| 3896 | + uint operand, memory_order order, | ||
| 3897 | + memory_scope scope); | ||
| 3898 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int *object, int operand, | ||
| 3899 | + memory_order order, memory_scope scope); | ||
| 3900 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint *object, uint operand, | ||
| 3901 | + memory_order order, memory_scope scope); | ||
| 3902 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int *object, int operand, | ||
| 3903 | + memory_order order, memory_scope scope); | ||
| 3904 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint *object, | ||
| 3905 | + uint operand, memory_order order, | ||
| 3906 | + memory_scope scope); | ||
| 3907 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int *object, int operand, | ||
| 3908 | + memory_order order, memory_scope scope); | ||
| 3909 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint *object, | ||
| 3910 | + uint operand, memory_order order, | ||
| 3911 | + memory_scope scope); | ||
| 3912 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, | ||
| 3913 | + memory_order order, memory_scope scope); | ||
| 3914 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint *object, | ||
| 3915 | + uint operand, memory_order order, | ||
| 3916 | + memory_scope scope); | ||
| 3917 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, | ||
| 3918 | + memory_order order, memory_scope scope); | ||
| 3919 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint *object, | ||
| 3920 | + uint operand, memory_order order, | ||
| 3921 | + memory_scope scope); | ||
| 3922 | + | ||
| 3923 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 3924 | +#ifdef __opencl_c_atomic_scope_device | ||
| 3925 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long *object, | ||
| 3926 | + long operand, memory_order order); | ||
| 3927 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong *object, | ||
| 3928 | + ulong operand, memory_order order); | ||
| 3929 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long *object, | ||
| 3930 | + long operand, memory_order order); | ||
| 3931 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong *object, | ||
| 3932 | + ulong operand, memory_order order); | ||
| 3933 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long *object, long operand, | ||
| 3934 | + memory_order order); | ||
| 3935 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong *object, | ||
| 3936 | + ulong operand, memory_order order); | ||
| 3937 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long *object, | ||
| 3938 | + long operand, memory_order order); | ||
| 3939 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong *object, | ||
| 3940 | + ulong operand, memory_order order); | ||
| 3941 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long *object, | ||
| 3942 | + long operand, memory_order order); | ||
| 3943 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong *object, | ||
| 3944 | + ulong operand, memory_order order); | ||
| 3945 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long *object, | ||
| 3946 | + long operand, memory_order order); | ||
| 3947 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, | ||
| 3948 | + ulong operand, memory_order order); | ||
| 3949 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long *object, | ||
| 3950 | + long operand, memory_order order); | ||
| 3951 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, | ||
| 3952 | + ulong operand, memory_order order); | ||
| 3953 | +#endif // __opencl_c_atomic_scope_device | ||
| 3954 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long *object, | ||
| 3955 | + long operand, memory_order order, | ||
| 3956 | + memory_scope scope); | ||
| 3957 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong *object, | ||
| 3958 | + ulong operand, memory_order order, | ||
| 3959 | + memory_scope scope); | ||
| 3960 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long *object, | ||
| 3961 | + long operand, memory_order order, | ||
| 3962 | + memory_scope scope); | ||
| 3963 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong *object, | ||
| 3964 | + ulong operand, memory_order order, | ||
| 3965 | + memory_scope scope); | ||
| 3966 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long *object, long operand, | ||
| 3967 | + memory_order order, memory_scope scope); | ||
| 3968 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong *object, | ||
| 3969 | + ulong operand, memory_order order, | ||
| 3970 | + memory_scope scope); | ||
| 3971 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long *object, | ||
| 3972 | + long operand, memory_order order, | ||
| 3973 | + memory_scope scope); | ||
| 3974 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong *object, | ||
| 3975 | + ulong operand, memory_order order, | ||
| 3976 | + memory_scope scope); | ||
| 3977 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long *object, | ||
| 3978 | + long operand, memory_order order, | ||
| 3979 | + memory_scope scope); | ||
| 3980 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong *object, | ||
| 3981 | + ulong operand, memory_order order, | ||
| 3982 | + memory_scope scope); | ||
| 3983 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long *object, | ||
| 3984 | + long operand, memory_order order, | ||
| 3985 | + memory_scope scope); | ||
| 3986 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong *object, | ||
| 3987 | + ulong operand, memory_order order, | ||
| 3988 | + memory_scope scope); | ||
| 3989 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long *object, | ||
| 3990 | + long operand, memory_order order, | ||
| 3991 | + memory_scope scope); | ||
| 3992 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong *object, | ||
| 3993 | + ulong operand, memory_order order, | ||
| 3994 | + memory_scope scope); | ||
| 3995 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 3996 | + // defined(cl_khr_int64_extended_atomics) | ||
| 3997 | + | ||
| 3998 | +// OpenCL v2.0 s6.13.11.7.5: | ||
| 3999 | +// add/sub: atomic type argument can be uintptr_t/intptr_t, value type argument | ||
| 4000 | +// can be ptrdiff_t. or/xor/and/min/max: atomic type argument can be | ||
| 4001 | +// intptr_t/uintptr_t, value type argument can be intptr_t/uintptr_t. | ||
| 4002 | + | ||
| 4003 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4004 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4005 | +uintptr_t __ovld atomic_fetch_add_explicit(volatile atomic_uintptr_t *object, | ||
| 4006 | + ptrdiff_t operand, | ||
| 4007 | + memory_order order); | ||
| 4008 | +uintptr_t __ovld atomic_fetch_sub_explicit(volatile atomic_uintptr_t *object, | ||
| 4009 | + ptrdiff_t operand, | ||
| 4010 | + memory_order order); | ||
| 4011 | +uintptr_t __ovld atomic_fetch_or_explicit(volatile atomic_uintptr_t *object, | ||
| 4012 | + intptr_t operand, memory_order order); | ||
| 4013 | +uintptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_uintptr_t *object, | ||
| 4014 | + intptr_t operand, | ||
| 4015 | + memory_order order); | ||
| 4016 | +uintptr_t __ovld atomic_fetch_and_explicit(volatile atomic_uintptr_t *object, | ||
| 4017 | + intptr_t operand, | ||
| 4018 | + memory_order order); | ||
| 4019 | +uintptr_t __ovld atomic_fetch_min_explicit(volatile atomic_uintptr_t *object, | ||
| 4020 | + intptr_t opermax, | ||
| 4021 | + memory_order minder); | ||
| 4022 | +uintptr_t __ovld atomic_fetch_max_explicit(volatile atomic_uintptr_t *object, | ||
| 4023 | + intptr_t opermax, | ||
| 4024 | + memory_order minder); | ||
| 4025 | +intptr_t __ovld atomic_fetch_or_explicit(volatile atomic_intptr_t *object, | ||
| 4026 | + uintptr_t operand, memory_order order); | ||
| 4027 | +intptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_intptr_t *object, | ||
| 4028 | + uintptr_t operand, | ||
| 4029 | + memory_order order); | ||
| 4030 | +intptr_t __ovld atomic_fetch_and_explicit(volatile atomic_intptr_t *object, | ||
| 4031 | + uintptr_t operand, | ||
| 4032 | + memory_order order); | ||
| 4033 | +intptr_t __ovld atomic_fetch_min_explicit(volatile atomic_intptr_t *object, | ||
| 4034 | + uintptr_t opermax, | ||
| 4035 | + memory_order minder); | ||
| 4036 | +intptr_t __ovld atomic_fetch_max_explicit(volatile atomic_intptr_t *object, | ||
| 4037 | + uintptr_t opermax, | ||
| 4038 | + memory_order minder); | ||
| 4039 | +#endif // __opencl_c_atomic_scope_device | ||
| 4040 | +uintptr_t __ovld atomic_fetch_add_explicit(volatile atomic_uintptr_t *object, | ||
| 4041 | + ptrdiff_t operand, | ||
| 4042 | + memory_order order, | ||
| 4043 | + memory_scope scope); | ||
| 4044 | +uintptr_t __ovld atomic_fetch_sub_explicit(volatile atomic_uintptr_t *object, | ||
| 4045 | + ptrdiff_t operand, | ||
| 4046 | + memory_order order, | ||
| 4047 | + memory_scope scope); | ||
| 4048 | + | ||
| 4049 | +uintptr_t __ovld atomic_fetch_or_explicit(volatile atomic_uintptr_t *object, | ||
| 4050 | + intptr_t operand, memory_order order, | ||
| 4051 | + memory_scope scope); | ||
| 4052 | +uintptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_uintptr_t *object, | ||
| 4053 | + intptr_t operand, memory_order order, | ||
| 4054 | + memory_scope scope); | ||
| 4055 | +uintptr_t __ovld atomic_fetch_and_explicit(volatile atomic_uintptr_t *object, | ||
| 4056 | + intptr_t operand, memory_order order, | ||
| 4057 | + memory_scope scope); | ||
| 4058 | +uintptr_t __ovld atomic_fetch_min_explicit(volatile atomic_uintptr_t *object, | ||
| 4059 | + intptr_t opermax, | ||
| 4060 | + memory_order minder, | ||
| 4061 | + memory_scope scope); | ||
| 4062 | +uintptr_t __ovld atomic_fetch_max_explicit(volatile atomic_uintptr_t *object, | ||
| 4063 | + intptr_t opermax, | ||
| 4064 | + memory_order minder, | ||
| 4065 | + memory_scope scope); | ||
| 4066 | + | ||
| 4067 | +intptr_t __ovld atomic_fetch_or_explicit(volatile atomic_intptr_t *object, | ||
| 4068 | + uintptr_t operand, memory_order order, | ||
| 4069 | + memory_scope scope); | ||
| 4070 | +intptr_t __ovld atomic_fetch_xor_explicit(volatile atomic_intptr_t *object, | ||
| 4071 | + uintptr_t operand, memory_order order, | ||
| 4072 | + memory_scope scope); | ||
| 4073 | +intptr_t __ovld atomic_fetch_and_explicit(volatile atomic_intptr_t *object, | ||
| 4074 | + uintptr_t operand, memory_order order, | ||
| 4075 | + memory_scope scope); | ||
| 4076 | +intptr_t __ovld atomic_fetch_min_explicit(volatile atomic_intptr_t *object, | ||
| 4077 | + uintptr_t opermax, | ||
| 4078 | + memory_order minder, | ||
| 4079 | + memory_scope scope); | ||
| 4080 | +intptr_t __ovld atomic_fetch_max_explicit(volatile atomic_intptr_t *object, | ||
| 4081 | + uintptr_t opermax, | ||
| 4082 | + memory_order minder, | ||
| 4083 | + memory_scope scope); | ||
| 4084 | #endif | ||
| 4085 | +#endif // __opencl_c_generic_address_space | ||
| 4086 | + | ||
| 4087 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4088 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4089 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int __global *object, | ||
| 4090 | + int operand, memory_order order); | ||
| 4091 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int __local *object, | ||
| 4092 | + int operand, memory_order order); | ||
| 4093 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint __global *object, | ||
| 4094 | + uint operand, memory_order order); | ||
| 4095 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint __local *object, | ||
| 4096 | + uint operand, memory_order order); | ||
| 4097 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int __global *object, | ||
| 4098 | + int operand, memory_order order); | ||
| 4099 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int __local *object, | ||
| 4100 | + int operand, memory_order order); | ||
| 4101 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint __global *object, | ||
| 4102 | + uint operand, memory_order order); | ||
| 4103 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint __local *object, | ||
| 4104 | + uint operand, memory_order order); | ||
| 4105 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int __global *object, | ||
| 4106 | + int operand, memory_order order); | ||
| 4107 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int __local *object, | ||
| 4108 | + int operand, memory_order order); | ||
| 4109 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint __global *object, | ||
| 4110 | + uint operand, memory_order order); | ||
| 4111 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint __local *object, | ||
| 4112 | + uint operand, memory_order order); | ||
| 4113 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int __global *object, | ||
| 4114 | + int operand, memory_order order); | ||
| 4115 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int __local *object, | ||
| 4116 | + int operand, memory_order order); | ||
| 4117 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint __global *object, | ||
| 4118 | + uint operand, memory_order order); | ||
| 4119 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint __local *object, | ||
| 4120 | + uint operand, memory_order order); | ||
| 4121 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int __global *object, | ||
| 4122 | + int operand, memory_order order); | ||
| 4123 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int __local *object, | ||
| 4124 | + int operand, memory_order order); | ||
| 4125 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint __global *object, | ||
| 4126 | + uint operand, memory_order order); | ||
| 4127 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint __local *object, | ||
| 4128 | + uint operand, memory_order order); | ||
| 4129 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int __global *object, | ||
| 4130 | + int operand, memory_order order); | ||
| 4131 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int __local *object, | ||
| 4132 | + int operand, memory_order order); | ||
| 4133 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint __global *object, | ||
| 4134 | + uint operand, memory_order order); | ||
| 4135 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint __local *object, | ||
| 4136 | + uint operand, memory_order order); | ||
| 4137 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int __global *object, | ||
| 4138 | + int operand, memory_order order); | ||
| 4139 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int __local *object, | ||
| 4140 | + int operand, memory_order order); | ||
| 4141 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint __global *object, | ||
| 4142 | + uint operand, memory_order order); | ||
| 4143 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint __local *object, | ||
| 4144 | + uint operand, memory_order order); | ||
| 4145 | +#endif // __opencl_c_atomic_scope_device | ||
| 4146 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int __global *object, | ||
| 4147 | + int operand, memory_order order, | ||
| 4148 | + memory_scope scope); | ||
| 4149 | +int __ovld atomic_fetch_add_explicit(volatile atomic_int __local *object, | ||
| 4150 | + int operand, memory_order order, | ||
| 4151 | + memory_scope scope); | ||
| 4152 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint __global *object, | ||
| 4153 | + uint operand, memory_order order, | ||
| 4154 | + memory_scope scope); | ||
| 4155 | +uint __ovld atomic_fetch_add_explicit(volatile atomic_uint __local *object, | ||
| 4156 | + uint operand, memory_order order, | ||
| 4157 | + memory_scope scope); | ||
| 4158 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int __global *object, | ||
| 4159 | + int operand, memory_order order, | ||
| 4160 | + memory_scope scope); | ||
| 4161 | +int __ovld atomic_fetch_sub_explicit(volatile atomic_int __local *object, | ||
| 4162 | + int operand, memory_order order, | ||
| 4163 | + memory_scope scope); | ||
| 4164 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint __global *object, | ||
| 4165 | + uint operand, memory_order order, | ||
| 4166 | + memory_scope scope); | ||
| 4167 | +uint __ovld atomic_fetch_sub_explicit(volatile atomic_uint __local *object, | ||
| 4168 | + uint operand, memory_order order, | ||
| 4169 | + memory_scope scope); | ||
| 4170 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int __global *object, | ||
| 4171 | + int operand, memory_order order, | ||
| 4172 | + memory_scope scope); | ||
| 4173 | +int __ovld atomic_fetch_or_explicit(volatile atomic_int __local *object, | ||
| 4174 | + int operand, memory_order order, | ||
| 4175 | + memory_scope scope); | ||
| 4176 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint __global *object, | ||
| 4177 | + uint operand, memory_order order, | ||
| 4178 | + memory_scope scope); | ||
| 4179 | +uint __ovld atomic_fetch_or_explicit(volatile atomic_uint __local *object, | ||
| 4180 | + uint operand, memory_order order, | ||
| 4181 | + memory_scope scope); | ||
| 4182 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int __global *object, | ||
| 4183 | + int operand, memory_order order, | ||
| 4184 | + memory_scope scope); | ||
| 4185 | +int __ovld atomic_fetch_xor_explicit(volatile atomic_int __local *object, | ||
| 4186 | + int operand, memory_order order, | ||
| 4187 | + memory_scope scope); | ||
| 4188 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint __global *object, | ||
| 4189 | + uint operand, memory_order order, | ||
| 4190 | + memory_scope scope); | ||
| 4191 | +uint __ovld atomic_fetch_xor_explicit(volatile atomic_uint __local *object, | ||
| 4192 | + uint operand, memory_order order, | ||
| 4193 | + memory_scope scope); | ||
| 4194 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int __global *object, | ||
| 4195 | + int operand, memory_order order, | ||
| 4196 | + memory_scope scope); | ||
| 4197 | +int __ovld atomic_fetch_and_explicit(volatile atomic_int __local *object, | ||
| 4198 | + int operand, memory_order order, | ||
| 4199 | + memory_scope scope); | ||
| 4200 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint __global *object, | ||
| 4201 | + uint operand, memory_order order, | ||
| 4202 | + memory_scope scope); | ||
| 4203 | +uint __ovld atomic_fetch_and_explicit(volatile atomic_uint __local *object, | ||
| 4204 | + uint operand, memory_order order, | ||
| 4205 | + memory_scope scope); | ||
| 4206 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int __global *object, | ||
| 4207 | + int operand, memory_order order, | ||
| 4208 | + memory_scope scope); | ||
| 4209 | +int __ovld atomic_fetch_min_explicit(volatile atomic_int __local *object, | ||
| 4210 | + int operand, memory_order order, | ||
| 4211 | + memory_scope scope); | ||
| 4212 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint __global *object, | ||
| 4213 | + uint operand, memory_order order, | ||
| 4214 | + memory_scope scope); | ||
| 4215 | +uint __ovld atomic_fetch_min_explicit(volatile atomic_uint __local *object, | ||
| 4216 | + uint operand, memory_order order, | ||
| 4217 | + memory_scope scope); | ||
| 4218 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int __global *object, | ||
| 4219 | + int operand, memory_order order, | ||
| 4220 | + memory_scope scope); | ||
| 4221 | +int __ovld atomic_fetch_max_explicit(volatile atomic_int __local *object, | ||
| 4222 | + int operand, memory_order order, | ||
| 4223 | + memory_scope scope); | ||
| 4224 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint __global *object, | ||
| 4225 | + uint operand, memory_order order, | ||
| 4226 | + memory_scope scope); | ||
| 4227 | +uint __ovld atomic_fetch_max_explicit(volatile atomic_uint __local *object, | ||
| 4228 | + uint operand, memory_order order, | ||
| 4229 | + memory_scope scope); | ||
| 4230 | + | ||
| 4231 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4232 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4233 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long __global *object, | ||
| 4234 | + long operand, memory_order order); | ||
| 4235 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long __local *object, | ||
| 4236 | + long operand, memory_order order); | ||
| 4237 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong __global *object, | ||
| 4238 | + ulong operand, memory_order order); | ||
| 4239 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong __local *object, | ||
| 4240 | + ulong operand, memory_order order); | ||
| 4241 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long __global *object, | ||
| 4242 | + long operand, memory_order order); | ||
| 4243 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long __local *object, | ||
| 4244 | + long operand, memory_order order); | ||
| 4245 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong __global *object, | ||
| 4246 | + ulong operand, memory_order order); | ||
| 4247 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong __local *object, | ||
| 4248 | + ulong operand, memory_order order); | ||
| 4249 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long __global *object, | ||
| 4250 | + long operand, memory_order order); | ||
| 4251 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long __local *object, | ||
| 4252 | + long operand, memory_order order); | ||
| 4253 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong __global *object, | ||
| 4254 | + ulong operand, memory_order order); | ||
| 4255 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong __local *object, | ||
| 4256 | + ulong operand, memory_order order); | ||
| 4257 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long __global *object, | ||
| 4258 | + long operand, memory_order order); | ||
| 4259 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long __local *object, | ||
| 4260 | + long operand, memory_order order); | ||
| 4261 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong __global *object, | ||
| 4262 | + ulong operand, memory_order order); | ||
| 4263 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong __local *object, | ||
| 4264 | + ulong operand, memory_order order); | ||
| 4265 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long __global *object, | ||
| 4266 | + long operand, memory_order order); | ||
| 4267 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long __local *object, | ||
| 4268 | + long operand, memory_order order); | ||
| 4269 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong __global *object, | ||
| 4270 | + ulong operand, memory_order order); | ||
| 4271 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong __local *object, | ||
| 4272 | + ulong operand, memory_order order); | ||
| 4273 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long __global *object, | ||
| 4274 | + long operand, memory_order order); | ||
| 4275 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long __local *object, | ||
| 4276 | + long operand, memory_order order); | ||
| 4277 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong __global *object, | ||
| 4278 | + ulong operand, memory_order order); | ||
| 4279 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong __local *object, | ||
| 4280 | + ulong operand, memory_order order); | ||
| 4281 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long __global *object, | ||
| 4282 | + long operand, memory_order order); | ||
| 4283 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long __local *object, | ||
| 4284 | + long operand, memory_order order); | ||
| 4285 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong __global *object, | ||
| 4286 | + ulong operand, memory_order order); | ||
| 4287 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong __local *object, | ||
| 4288 | + ulong operand, memory_order order); | ||
| 4289 | +#endif // __opencl_c_atomic_scope_device | ||
| 4290 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long __global *object, | ||
| 4291 | + long operand, memory_order order, | ||
| 4292 | + memory_scope scope); | ||
| 4293 | +long __ovld atomic_fetch_add_explicit(volatile atomic_long __local *object, | ||
| 4294 | + long operand, memory_order order, | ||
| 4295 | + memory_scope scope); | ||
| 4296 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong __global *object, | ||
| 4297 | + ulong operand, memory_order order, | ||
| 4298 | + memory_scope scope); | ||
| 4299 | +ulong __ovld atomic_fetch_add_explicit(volatile atomic_ulong __local *object, | ||
| 4300 | + ulong operand, memory_order order, | ||
| 4301 | + memory_scope scope); | ||
| 4302 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long __global *object, | ||
| 4303 | + long operand, memory_order order, | ||
| 4304 | + memory_scope scope); | ||
| 4305 | +long __ovld atomic_fetch_sub_explicit(volatile atomic_long __local *object, | ||
| 4306 | + long operand, memory_order order, | ||
| 4307 | + memory_scope scope); | ||
| 4308 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong __global *object, | ||
| 4309 | + ulong operand, memory_order order, | ||
| 4310 | + memory_scope scope); | ||
| 4311 | +ulong __ovld atomic_fetch_sub_explicit(volatile atomic_ulong __local *object, | ||
| 4312 | + ulong operand, memory_order order, | ||
| 4313 | + memory_scope scope); | ||
| 4314 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long __global *object, | ||
| 4315 | + long operand, memory_order order, | ||
| 4316 | + memory_scope scope); | ||
| 4317 | +long __ovld atomic_fetch_or_explicit(volatile atomic_long __local *object, | ||
| 4318 | + long operand, memory_order order, | ||
| 4319 | + memory_scope scope); | ||
| 4320 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong __global *object, | ||
| 4321 | + ulong operand, memory_order order, | ||
| 4322 | + memory_scope scope); | ||
| 4323 | +ulong __ovld atomic_fetch_or_explicit(volatile atomic_ulong __local *object, | ||
| 4324 | + ulong operand, memory_order order, | ||
| 4325 | + memory_scope scope); | ||
| 4326 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long __global *object, | ||
| 4327 | + long operand, memory_order order, | ||
| 4328 | + memory_scope scope); | ||
| 4329 | +long __ovld atomic_fetch_xor_explicit(volatile atomic_long __local *object, | ||
| 4330 | + long operand, memory_order order, | ||
| 4331 | + memory_scope scope); | ||
| 4332 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong __global *object, | ||
| 4333 | + ulong operand, memory_order order, | ||
| 4334 | + memory_scope scope); | ||
| 4335 | +ulong __ovld atomic_fetch_xor_explicit(volatile atomic_ulong __local *object, | ||
| 4336 | + ulong operand, memory_order order, | ||
| 4337 | + memory_scope scope); | ||
| 4338 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long __global *object, | ||
| 4339 | + long operand, memory_order order, | ||
| 4340 | + memory_scope scope); | ||
| 4341 | +long __ovld atomic_fetch_and_explicit(volatile atomic_long __local *object, | ||
| 4342 | + long operand, memory_order order, | ||
| 4343 | + memory_scope scope); | ||
| 4344 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong __global *object, | ||
| 4345 | + ulong operand, memory_order order, | ||
| 4346 | + memory_scope scope); | ||
| 4347 | +ulong __ovld atomic_fetch_and_explicit(volatile atomic_ulong __local *object, | ||
| 4348 | + ulong operand, memory_order order, | ||
| 4349 | + memory_scope scope); | ||
| 4350 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long __global *object, | ||
| 4351 | + long operand, memory_order order, | ||
| 4352 | + memory_scope scope); | ||
| 4353 | +long __ovld atomic_fetch_min_explicit(volatile atomic_long __local *object, | ||
| 4354 | + long operand, memory_order order, | ||
| 4355 | + memory_scope scope); | ||
| 4356 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong __global *object, | ||
| 4357 | + ulong operand, memory_order order, | ||
| 4358 | + memory_scope scope); | ||
| 4359 | +ulong __ovld atomic_fetch_min_explicit(volatile atomic_ulong __local *object, | ||
| 4360 | + ulong operand, memory_order order, | ||
| 4361 | + memory_scope scope); | ||
| 4362 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long __global *object, | ||
| 4363 | + long operand, memory_order order, | ||
| 4364 | + memory_scope scope); | ||
| 4365 | +long __ovld atomic_fetch_max_explicit(volatile atomic_long __local *object, | ||
| 4366 | + long operand, memory_order order, | ||
| 4367 | + memory_scope scope); | ||
| 4368 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong __global *object, | ||
| 4369 | + ulong operand, memory_order order, | ||
| 4370 | + memory_scope scope); | ||
| 4371 | +ulong __ovld atomic_fetch_max_explicit(volatile atomic_ulong __local *object, | ||
| 4372 | + ulong operand, memory_order order, | ||
| 4373 | + memory_scope scope); | ||
| 4374 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4375 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4376 | + | ||
| 4377 | +// OpenCL v2.0 s6.13.11.7.5: | ||
| 4378 | +// add/sub: atomic type argument can be uintptr_t/intptr_t, value type argument | ||
| 4379 | +// can be ptrdiff_t. or/xor/and/min/max: atomic type argument can be | ||
| 4380 | +// intptr_t/uintptr_t, value type argument can be intptr_t/uintptr_t. | ||
| 4381 | + | ||
| 4382 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4383 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4384 | +uintptr_t __ovld | ||
| 4385 | +atomic_fetch_add_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4386 | + ptrdiff_t operand, memory_order order); | ||
| 4387 | +uintptr_t __ovld | ||
| 4388 | +atomic_fetch_add_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4389 | + ptrdiff_t operand, memory_order order); | ||
| 4390 | +uintptr_t __ovld | ||
| 4391 | +atomic_fetch_sub_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4392 | + ptrdiff_t operand, memory_order order); | ||
| 4393 | +uintptr_t __ovld | ||
| 4394 | +atomic_fetch_sub_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4395 | + ptrdiff_t operand, memory_order order); | ||
| 4396 | +uintptr_t __ovld | ||
| 4397 | +atomic_fetch_or_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4398 | + intptr_t operand, memory_order order); | ||
| 4399 | +uintptr_t __ovld | ||
| 4400 | +atomic_fetch_or_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4401 | + intptr_t operand, memory_order order); | ||
| 4402 | +uintptr_t __ovld | ||
| 4403 | +atomic_fetch_xor_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4404 | + intptr_t operand, memory_order order); | ||
| 4405 | +uintptr_t __ovld | ||
| 4406 | +atomic_fetch_xor_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4407 | + intptr_t operand, memory_order order); | ||
| 4408 | +uintptr_t __ovld | ||
| 4409 | +atomic_fetch_and_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4410 | + intptr_t operand, memory_order order); | ||
| 4411 | +uintptr_t __ovld | ||
| 4412 | +atomic_fetch_and_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4413 | + intptr_t operand, memory_order order); | ||
| 4414 | +uintptr_t __ovld | ||
| 4415 | +atomic_fetch_min_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4416 | + intptr_t opermax, memory_order minder); | ||
| 4417 | +uintptr_t __ovld | ||
| 4418 | +atomic_fetch_min_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4419 | + intptr_t opermax, memory_order minder); | ||
| 4420 | +uintptr_t __ovld | ||
| 4421 | +atomic_fetch_max_explicit(volatile atomic_uintptr_t __global *object, | ||
| 4422 | + intptr_t opermax, memory_order minder); | ||
| 4423 | +uintptr_t __ovld | ||
| 4424 | +atomic_fetch_max_explicit(volatile atomic_uintptr_t __local *object, | ||
| 4425 | + intptr_t opermax, memory_order minder); | ||
| 4426 | +intptr_t __ovld | ||
| 4427 | +atomic_fetch_or_explicit(volatile atomic_intptr_t __global *object, | ||
| 4428 | + uintptr_t operand, memory_order order); | ||
| 4429 | +intptr_t __ovld | ||
| 4430 | +atomic_fetch_or_explicit(volatile atomic_intptr_t __local *object, | ||
| 4431 | + uintptr_t operand, memory_order order); | ||
| 4432 | +intptr_t __ovld | ||
| 4433 | +atomic_fetch_xor_explicit(volatile atomic_intptr_t __global *object, | ||
| 4434 | + uintptr_t operand, memory_order order); | ||
| 4435 | +intptr_t __ovld | ||
| 4436 | +atomic_fetch_xor_explicit(volatile atomic_intptr_t __local *object, | ||
| 4437 | + uintptr_t operand, memory_order order); | ||
| 4438 | +intptr_t __ovld | ||
| 4439 | +atomic_fetch_and_explicit(volatile atomic_intptr_t __global *object, | ||
| 4440 | + uintptr_t operand, memory_order order); | ||
| 4441 | +intptr_t __ovld | ||
| 4442 | +atomic_fetch_and_explicit(volatile atomic_intptr_t __local *object, | ||
| 4443 | + uintptr_t operand, memory_order order); | ||
| 4444 | +intptr_t __ovld | ||
| 4445 | +atomic_fetch_min_explicit(volatile atomic_intptr_t __global *object, | ||
| 4446 | + uintptr_t opermax, memory_order minder); | ||
| 4447 | +intptr_t __ovld | ||
| 4448 | +atomic_fetch_min_explicit(volatile atomic_intptr_t __local *object, | ||
| 4449 | + uintptr_t opermax, memory_order minder); | ||
| 4450 | +intptr_t __ovld | ||
| 4451 | +atomic_fetch_max_explicit(volatile atomic_intptr_t __global *object, | ||
| 4452 | + uintptr_t opermax, memory_order minder); | ||
| 4453 | +intptr_t __ovld | ||
| 4454 | +atomic_fetch_max_explicit(volatile atomic_intptr_t __local *object, | ||
| 4455 | + uintptr_t opermax, memory_order minder); | ||
| 4456 | +#endif // __opencl_c_atomic_scope_device | ||
| 4457 | +uintptr_t __ovld atomic_fetch_add_explicit( | ||
| 4458 | + volatile atomic_uintptr_t __global *object, ptrdiff_t operand, | ||
| 4459 | + memory_order order, memory_scope scope); | ||
| 4460 | +uintptr_t __ovld atomic_fetch_add_explicit( | ||
| 4461 | + volatile atomic_uintptr_t __local *object, ptrdiff_t operand, | ||
| 4462 | + memory_order order, memory_scope scope); | ||
| 4463 | +uintptr_t __ovld atomic_fetch_sub_explicit( | ||
| 4464 | + volatile atomic_uintptr_t __global *object, ptrdiff_t operand, | ||
| 4465 | + memory_order order, memory_scope scope); | ||
| 4466 | +uintptr_t __ovld atomic_fetch_sub_explicit( | ||
| 4467 | + volatile atomic_uintptr_t __local *object, ptrdiff_t operand, | ||
| 4468 | + memory_order order, memory_scope scope); | ||
| 4469 | + | ||
| 4470 | +uintptr_t __ovld atomic_fetch_or_explicit( | ||
| 4471 | + volatile atomic_uintptr_t __global *object, intptr_t operand, | ||
| 4472 | + memory_order order, memory_scope scope); | ||
| 4473 | +uintptr_t __ovld atomic_fetch_or_explicit( | ||
| 4474 | + volatile atomic_uintptr_t __local *object, intptr_t operand, | ||
| 4475 | + memory_order order, memory_scope scope); | ||
| 4476 | +uintptr_t __ovld atomic_fetch_xor_explicit( | ||
| 4477 | + volatile atomic_uintptr_t __global *object, intptr_t operand, | ||
| 4478 | + memory_order order, memory_scope scope); | ||
| 4479 | +uintptr_t __ovld atomic_fetch_xor_explicit( | ||
| 4480 | + volatile atomic_uintptr_t __local *object, intptr_t operand, | ||
| 4481 | + memory_order order, memory_scope scope); | ||
| 4482 | +uintptr_t __ovld atomic_fetch_and_explicit( | ||
| 4483 | + volatile atomic_uintptr_t __global *object, intptr_t operand, | ||
| 4484 | + memory_order order, memory_scope scope); | ||
| 4485 | +uintptr_t __ovld atomic_fetch_and_explicit( | ||
| 4486 | + volatile atomic_uintptr_t __local *object, intptr_t operand, | ||
| 4487 | + memory_order order, memory_scope scope); | ||
| 4488 | +uintptr_t __ovld atomic_fetch_min_explicit( | ||
| 4489 | + volatile atomic_uintptr_t __global *object, intptr_t opermax, | ||
| 4490 | + memory_order minder, memory_scope scope); | ||
| 4491 | +uintptr_t __ovld atomic_fetch_min_explicit( | ||
| 4492 | + volatile atomic_uintptr_t __local *object, intptr_t opermax, | ||
| 4493 | + memory_order minder, memory_scope scope); | ||
| 4494 | +uintptr_t __ovld atomic_fetch_max_explicit( | ||
| 4495 | + volatile atomic_uintptr_t __global *object, intptr_t opermax, | ||
| 4496 | + memory_order minder, memory_scope scope); | ||
| 4497 | +uintptr_t __ovld atomic_fetch_max_explicit( | ||
| 4498 | + volatile atomic_uintptr_t __local *object, intptr_t opermax, | ||
| 4499 | + memory_order minder, memory_scope scope); | ||
| 4500 | + | ||
| 4501 | +intptr_t __ovld atomic_fetch_or_explicit( | ||
| 4502 | + volatile atomic_intptr_t __global *object, uintptr_t operand, | ||
| 4503 | + memory_order order, memory_scope scope); | ||
| 4504 | +intptr_t __ovld atomic_fetch_or_explicit( | ||
| 4505 | + volatile atomic_intptr_t __local *object, uintptr_t operand, | ||
| 4506 | + memory_order order, memory_scope scope); | ||
| 4507 | +intptr_t __ovld atomic_fetch_xor_explicit( | ||
| 4508 | + volatile atomic_intptr_t __global *object, uintptr_t operand, | ||
| 4509 | + memory_order order, memory_scope scope); | ||
| 4510 | +intptr_t __ovld atomic_fetch_xor_explicit( | ||
| 4511 | + volatile atomic_intptr_t __local *object, uintptr_t operand, | ||
| 4512 | + memory_order order, memory_scope scope); | ||
| 4513 | +intptr_t __ovld atomic_fetch_and_explicit( | ||
| 4514 | + volatile atomic_intptr_t __global *object, uintptr_t operand, | ||
| 4515 | + memory_order order, memory_scope scope); | ||
| 4516 | +intptr_t __ovld atomic_fetch_and_explicit( | ||
| 4517 | + volatile atomic_intptr_t __local *object, uintptr_t operand, | ||
| 4518 | + memory_order order, memory_scope scope); | ||
| 4519 | +intptr_t __ovld atomic_fetch_min_explicit( | ||
| 4520 | + volatile atomic_intptr_t __global *object, uintptr_t opermax, | ||
| 4521 | + memory_order minder, memory_scope scope); | ||
| 4522 | +intptr_t __ovld atomic_fetch_min_explicit( | ||
| 4523 | + volatile atomic_intptr_t __local *object, uintptr_t opermax, | ||
| 4524 | + memory_order minder, memory_scope scope); | ||
| 4525 | +intptr_t __ovld atomic_fetch_max_explicit( | ||
| 4526 | + volatile atomic_intptr_t __global *object, uintptr_t opermax, | ||
| 4527 | + memory_order minder, memory_scope scope); | ||
| 4528 | +intptr_t __ovld atomic_fetch_max_explicit( | ||
| 4529 | + volatile atomic_intptr_t __local *object, uintptr_t opermax, | ||
| 4530 | + memory_order minder, memory_scope scope); | ||
| 4531 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4532 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4533 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4534 | |||
| 4535 | // atomic_store() | ||
| 4536 | |||
| 4537 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4538 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4539 | + | ||
| 4540 | +#ifdef __opencl_c_generic_address_space | ||
| 4541 | void __ovld atomic_store(volatile atomic_int *object, int desired); | ||
| 4542 | -void __ovld atomic_store_explicit(volatile atomic_int *object, int desired, memory_order order); | ||
| 4543 | -void __ovld atomic_store_explicit(volatile atomic_int *object, int desired, memory_order order, memory_scope scope); | ||
| 4544 | void __ovld atomic_store(volatile atomic_uint *object, uint desired); | ||
| 4545 | -void __ovld atomic_store_explicit(volatile atomic_uint *object, uint desired, memory_order order); | ||
| 4546 | -void __ovld atomic_store_explicit(volatile atomic_uint *object, uint desired, memory_order order, memory_scope scope); | ||
| 4547 | void __ovld atomic_store(volatile atomic_float *object, float desired); | ||
| 4548 | -void __ovld atomic_store_explicit(volatile atomic_float *object, float desired, memory_order order); | ||
| 4549 | -void __ovld atomic_store_explicit(volatile atomic_float *object, float desired, memory_order order, memory_scope scope); | ||
| 4550 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4551 | -#ifdef cl_khr_fp64 | ||
| 4552 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4553 | void __ovld atomic_store(volatile atomic_double *object, double desired); | ||
| 4554 | -void __ovld atomic_store_explicit(volatile atomic_double *object, double desired, memory_order order); | ||
| 4555 | -void __ovld atomic_store_explicit(volatile atomic_double *object, double desired, memory_order order, memory_scope scope); | ||
| 4556 | -#endif //cl_khr_fp64 | ||
| 4557 | +#endif | ||
| 4558 | void __ovld atomic_store(volatile atomic_long *object, long desired); | ||
| 4559 | -void __ovld atomic_store_explicit(volatile atomic_long *object, long desired, memory_order order); | ||
| 4560 | -void __ovld atomic_store_explicit(volatile atomic_long *object, long desired, memory_order order, memory_scope scope); | ||
| 4561 | void __ovld atomic_store(volatile atomic_ulong *object, ulong desired); | ||
| 4562 | -void __ovld atomic_store_explicit(volatile atomic_ulong *object, ulong desired, memory_order order); | ||
| 4563 | -void __ovld atomic_store_explicit(volatile atomic_ulong *object, ulong desired, memory_order order, memory_scope scope); | ||
| 4564 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4565 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4566 | +#endif // __opencl_c_generic_address_space | ||
| 4567 | + | ||
| 4568 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4569 | +void __ovld atomic_store(volatile atomic_int __global *object, int desired); | ||
| 4570 | +void __ovld atomic_store(volatile atomic_int __local *object, int desired); | ||
| 4571 | +void __ovld atomic_store(volatile atomic_uint __global *object, uint desired); | ||
| 4572 | +void __ovld atomic_store(volatile atomic_uint __local *object, uint desired); | ||
| 4573 | +void __ovld atomic_store(volatile atomic_float __global *object, float desired); | ||
| 4574 | +void __ovld atomic_store(volatile atomic_float __local *object, float desired); | ||
| 4575 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4576 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4577 | +void __ovld atomic_store(volatile atomic_double __global *object, | ||
| 4578 | + double desired); | ||
| 4579 | +void __ovld atomic_store(volatile atomic_double __local *object, | ||
| 4580 | + double desired); | ||
| 4581 | #endif | ||
| 4582 | +void __ovld atomic_store(volatile atomic_long __global *object, long desired); | ||
| 4583 | +void __ovld atomic_store(volatile atomic_long __local *object, long desired); | ||
| 4584 | +void __ovld atomic_store(volatile atomic_ulong __global *object, ulong desired); | ||
| 4585 | +void __ovld atomic_store(volatile atomic_ulong __local *object, ulong desired); | ||
| 4586 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4587 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4588 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4589 | + | ||
| 4590 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4591 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4592 | + | ||
| 4593 | +#ifdef __opencl_c_generic_address_space | ||
| 4594 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4595 | +void __ovld atomic_store_explicit(volatile atomic_int *object, int desired, | ||
| 4596 | + memory_order order); | ||
| 4597 | +void __ovld atomic_store_explicit(volatile atomic_uint *object, uint desired, | ||
| 4598 | + memory_order order); | ||
| 4599 | +void __ovld atomic_store_explicit(volatile atomic_float *object, float desired, | ||
| 4600 | + memory_order order); | ||
| 4601 | +#endif // __opencl_c_atomic_scope_device | ||
| 4602 | +void __ovld atomic_store_explicit(volatile atomic_int *object, int desired, | ||
| 4603 | + memory_order order, memory_scope scope); | ||
| 4604 | +void __ovld atomic_store_explicit(volatile atomic_uint *object, uint desired, | ||
| 4605 | + memory_order order, memory_scope scope); | ||
| 4606 | +void __ovld atomic_store_explicit(volatile atomic_float *object, float desired, | ||
| 4607 | + memory_order order, memory_scope scope); | ||
| 4608 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4609 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4610 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4611 | +void __ovld atomic_store_explicit(volatile atomic_double *object, | ||
| 4612 | + double desired, memory_order order); | ||
| 4613 | +#endif //__opencl_c_atomic_scope_device | ||
| 4614 | +void __ovld atomic_store_explicit(volatile atomic_double *object, | ||
| 4615 | + double desired, memory_order order, | ||
| 4616 | + memory_scope scope); | ||
| 4617 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4618 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4619 | +void __ovld atomic_store_explicit(volatile atomic_long *object, long desired, | ||
| 4620 | + memory_order order); | ||
| 4621 | +void __ovld atomic_store_explicit(volatile atomic_ulong *object, ulong desired, | ||
| 4622 | + memory_order order); | ||
| 4623 | +#endif //__opencl_c_atomic_scope_device | ||
| 4624 | +void __ovld atomic_store_explicit(volatile atomic_long *object, long desired, | ||
| 4625 | + memory_order order, memory_scope scope); | ||
| 4626 | +void __ovld atomic_store_explicit(volatile atomic_ulong *object, ulong desired, | ||
| 4627 | + memory_order order, memory_scope scope); | ||
| 4628 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4629 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4630 | +#endif // __opencl_c_generic_address_space | ||
| 4631 | + | ||
| 4632 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4633 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4634 | +void __ovld atomic_store_explicit(volatile atomic_int __global *object, | ||
| 4635 | + int desired, memory_order order); | ||
| 4636 | +void __ovld atomic_store_explicit(volatile atomic_int __local *object, | ||
| 4637 | + int desired, memory_order order); | ||
| 4638 | +void __ovld atomic_store_explicit(volatile atomic_uint __global *object, | ||
| 4639 | + uint desired, memory_order order); | ||
| 4640 | +void __ovld atomic_store_explicit(volatile atomic_uint __local *object, | ||
| 4641 | + uint desired, memory_order order); | ||
| 4642 | +void __ovld atomic_store_explicit(volatile atomic_float __global *object, | ||
| 4643 | + float desired, memory_order order); | ||
| 4644 | +void __ovld atomic_store_explicit(volatile atomic_float __local *object, | ||
| 4645 | + float desired, memory_order order); | ||
| 4646 | +#endif // __opencl_c_atomic_scope_device | ||
| 4647 | +void __ovld atomic_store_explicit(volatile atomic_int __global *object, | ||
| 4648 | + int desired, memory_order order, | ||
| 4649 | + memory_scope scope); | ||
| 4650 | +void __ovld atomic_store_explicit(volatile atomic_int __local *object, | ||
| 4651 | + int desired, memory_order order, | ||
| 4652 | + memory_scope scope); | ||
| 4653 | +void __ovld atomic_store_explicit(volatile atomic_uint __global *object, | ||
| 4654 | + uint desired, memory_order order, | ||
| 4655 | + memory_scope scope); | ||
| 4656 | +void __ovld atomic_store_explicit(volatile atomic_uint __local *object, | ||
| 4657 | + uint desired, memory_order order, | ||
| 4658 | + memory_scope scope); | ||
| 4659 | +void __ovld atomic_store_explicit(volatile atomic_float __global *object, | ||
| 4660 | + float desired, memory_order order, | ||
| 4661 | + memory_scope scope); | ||
| 4662 | +void __ovld atomic_store_explicit(volatile atomic_float __local *object, | ||
| 4663 | + float desired, memory_order order, | ||
| 4664 | + memory_scope scope); | ||
| 4665 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4666 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4667 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4668 | +void __ovld atomic_store_explicit(volatile atomic_double __global *object, | ||
| 4669 | + double desired, memory_order order); | ||
| 4670 | +void __ovld atomic_store_explicit(volatile atomic_double __local *object, | ||
| 4671 | + double desired, memory_order order); | ||
| 4672 | +#endif //__opencl_c_atomic_scope_device | ||
| 4673 | +void __ovld atomic_store_explicit(volatile atomic_double __global *object, | ||
| 4674 | + double desired, memory_order order, | ||
| 4675 | + memory_scope scope); | ||
| 4676 | +void __ovld atomic_store_explicit(volatile atomic_double __local *object, | ||
| 4677 | + double desired, memory_order order, | ||
| 4678 | + memory_scope scope); | ||
| 4679 | +#endif // cl_khr_fp64 | ||
| 4680 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4681 | +void __ovld atomic_store_explicit(volatile atomic_long __global *object, | ||
| 4682 | + long desired, memory_order order); | ||
| 4683 | +void __ovld atomic_store_explicit(volatile atomic_long __local *object, | ||
| 4684 | + long desired, memory_order order); | ||
| 4685 | +void __ovld atomic_store_explicit(volatile atomic_ulong __global *object, | ||
| 4686 | + ulong desired, memory_order order); | ||
| 4687 | +void __ovld atomic_store_explicit(volatile atomic_ulong __local *object, | ||
| 4688 | + ulong desired, memory_order order); | ||
| 4689 | +#endif // __opencl_c_atomic_scope_device | ||
| 4690 | +void __ovld atomic_store_explicit(volatile atomic_long __global *object, | ||
| 4691 | + long desired, memory_order order, | ||
| 4692 | + memory_scope scope); | ||
| 4693 | +void __ovld atomic_store_explicit(volatile atomic_long __local *object, | ||
| 4694 | + long desired, memory_order order, | ||
| 4695 | + memory_scope scope); | ||
| 4696 | +void __ovld atomic_store_explicit(volatile atomic_ulong __global *object, | ||
| 4697 | + ulong desired, memory_order order, | ||
| 4698 | + memory_scope scope); | ||
| 4699 | +void __ovld atomic_store_explicit(volatile atomic_ulong __local *object, | ||
| 4700 | + ulong desired, memory_order order, | ||
| 4701 | + memory_scope scope); | ||
| 4702 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4703 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4704 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4705 | |||
| 4706 | // atomic_load() | ||
| 4707 | - | ||
| 4708 | +#ifdef __opencl_c_generic_address_space | ||
| 4709 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4710 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4711 | int __ovld atomic_load(volatile atomic_int *object); | ||
| 4712 | -int __ovld atomic_load_explicit(volatile atomic_int *object, memory_order order); | ||
| 4713 | -int __ovld atomic_load_explicit(volatile atomic_int *object, memory_order order, memory_scope scope); | ||
| 4714 | uint __ovld atomic_load(volatile atomic_uint *object); | ||
| 4715 | -uint __ovld atomic_load_explicit(volatile atomic_uint *object, memory_order order); | ||
| 4716 | -uint __ovld atomic_load_explicit(volatile atomic_uint *object, memory_order order, memory_scope scope); | ||
| 4717 | float __ovld atomic_load(volatile atomic_float *object); | ||
| 4718 | -float __ovld atomic_load_explicit(volatile atomic_float *object, memory_order order); | ||
| 4719 | -float __ovld atomic_load_explicit(volatile atomic_float *object, memory_order order, memory_scope scope); | ||
| 4720 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4721 | -#ifdef cl_khr_fp64 | ||
| 4722 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4723 | double __ovld atomic_load(volatile atomic_double *object); | ||
| 4724 | -double __ovld atomic_load_explicit(volatile atomic_double *object, memory_order order); | ||
| 4725 | -double __ovld atomic_load_explicit(volatile atomic_double *object, memory_order order, memory_scope scope); | ||
| 4726 | -#endif //cl_khr_fp64 | ||
| 4727 | +#endif // cl_khr_fp64 | ||
| 4728 | long __ovld atomic_load(volatile atomic_long *object); | ||
| 4729 | -long __ovld atomic_load_explicit(volatile atomic_long *object, memory_order order); | ||
| 4730 | -long __ovld atomic_load_explicit(volatile atomic_long *object, memory_order order, memory_scope scope); | ||
| 4731 | ulong __ovld atomic_load(volatile atomic_ulong *object); | ||
| 4732 | -ulong __ovld atomic_load_explicit(volatile atomic_ulong *object, memory_order order); | ||
| 4733 | -ulong __ovld atomic_load_explicit(volatile atomic_ulong *object, memory_order order, memory_scope scope); | ||
| 4734 | -#endif | ||
| 4735 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4736 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4737 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4738 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4739 | +#endif //__opencl_c_generic_address_space | ||
| 4740 | + | ||
| 4741 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4742 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4743 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4744 | +int __ovld atomic_load(volatile atomic_int __global *object); | ||
| 4745 | +int __ovld atomic_load(volatile atomic_int __local *object); | ||
| 4746 | +uint __ovld atomic_load(volatile atomic_uint __global *object); | ||
| 4747 | +uint __ovld atomic_load(volatile atomic_uint __local *object); | ||
| 4748 | +float __ovld atomic_load(volatile atomic_float __global *object); | ||
| 4749 | +float __ovld atomic_load(volatile atomic_float __local *object); | ||
| 4750 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4751 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4752 | +double __ovld atomic_load(volatile atomic_double __global *object); | ||
| 4753 | +double __ovld atomic_load(volatile atomic_double __local *object); | ||
| 4754 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4755 | +long __ovld atomic_load(volatile atomic_long __global *object); | ||
| 4756 | +long __ovld atomic_load(volatile atomic_long __local *object); | ||
| 4757 | +ulong __ovld atomic_load(volatile atomic_ulong __global *object); | ||
| 4758 | +ulong __ovld atomic_load(volatile atomic_ulong __local *object); | ||
| 4759 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4760 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4761 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4762 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4763 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4764 | + | ||
| 4765 | +#ifdef __opencl_c_generic_address_space | ||
| 4766 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4767 | +int __ovld atomic_load_explicit(volatile atomic_int *object, | ||
| 4768 | + memory_order order); | ||
| 4769 | +uint __ovld atomic_load_explicit(volatile atomic_uint *object, | ||
| 4770 | + memory_order order); | ||
| 4771 | +float __ovld atomic_load_explicit(volatile atomic_float *object, | ||
| 4772 | + memory_order order); | ||
| 4773 | +#endif // __opencl_c_atomic_scope_device | ||
| 4774 | +int __ovld atomic_load_explicit(volatile atomic_int *object, memory_order order, | ||
| 4775 | + memory_scope scope); | ||
| 4776 | +uint __ovld atomic_load_explicit(volatile atomic_uint *object, | ||
| 4777 | + memory_order order, memory_scope scope); | ||
| 4778 | +float __ovld atomic_load_explicit(volatile atomic_float *object, | ||
| 4779 | + memory_order order, memory_scope scope); | ||
| 4780 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4781 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4782 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4783 | +double __ovld atomic_load_explicit(volatile atomic_double *object, | ||
| 4784 | + memory_order order); | ||
| 4785 | +#endif // __opencl_c_atomic_scope_device | ||
| 4786 | +double __ovld atomic_load_explicit(volatile atomic_double *object, | ||
| 4787 | + memory_order order, memory_scope scope); | ||
| 4788 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4789 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4790 | +long __ovld atomic_load_explicit(volatile atomic_long *object, | ||
| 4791 | + memory_order order); | ||
| 4792 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong *object, | ||
| 4793 | + memory_order order); | ||
| 4794 | +#endif //__opencl_c_atomic_scope_device | ||
| 4795 | +long __ovld atomic_load_explicit(volatile atomic_long *object, | ||
| 4796 | + memory_order order, memory_scope scope); | ||
| 4797 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong *object, | ||
| 4798 | + memory_order order, memory_scope scope); | ||
| 4799 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4800 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4801 | +#endif // __opencl_c_generic_address_space | ||
| 4802 | + | ||
| 4803 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4804 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4805 | +int __ovld atomic_load_explicit(volatile atomic_int __global *object, | ||
| 4806 | + memory_order order); | ||
| 4807 | +int __ovld atomic_load_explicit(volatile atomic_int __local *object, | ||
| 4808 | + memory_order order); | ||
| 4809 | +uint __ovld atomic_load_explicit(volatile atomic_uint __global *object, | ||
| 4810 | + memory_order order); | ||
| 4811 | +uint __ovld atomic_load_explicit(volatile atomic_uint __local *object, | ||
| 4812 | + memory_order order); | ||
| 4813 | +float __ovld atomic_load_explicit(volatile atomic_float __global *object, | ||
| 4814 | + memory_order order); | ||
| 4815 | +float __ovld atomic_load_explicit(volatile atomic_float __local *object, | ||
| 4816 | + memory_order order); | ||
| 4817 | +#endif // __opencl_c_atomic_scope_device | ||
| 4818 | +int __ovld atomic_load_explicit(volatile atomic_int __global *object, | ||
| 4819 | + memory_order order, memory_scope scope); | ||
| 4820 | +int __ovld atomic_load_explicit(volatile atomic_int __local *object, | ||
| 4821 | + memory_order order, memory_scope scope); | ||
| 4822 | +uint __ovld atomic_load_explicit(volatile atomic_uint __global *object, | ||
| 4823 | + memory_order order, memory_scope scope); | ||
| 4824 | +uint __ovld atomic_load_explicit(volatile atomic_uint __local *object, | ||
| 4825 | + memory_order order, memory_scope scope); | ||
| 4826 | +float __ovld atomic_load_explicit(volatile atomic_float __global *object, | ||
| 4827 | + memory_order order, memory_scope scope); | ||
| 4828 | +float __ovld atomic_load_explicit(volatile atomic_float __local *object, | ||
| 4829 | + memory_order order, memory_scope scope); | ||
| 4830 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4831 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4832 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4833 | +double __ovld atomic_load_explicit(volatile atomic_double __global *object, | ||
| 4834 | + memory_order order); | ||
| 4835 | +double __ovld atomic_load_explicit(volatile atomic_double __local *object, | ||
| 4836 | + memory_order order); | ||
| 4837 | +#endif // __opencl_c_atomic_scope_device | ||
| 4838 | +double __ovld atomic_load_explicit(volatile atomic_double __global *object, | ||
| 4839 | + memory_order order, memory_scope scope); | ||
| 4840 | +double __ovld atomic_load_explicit(volatile atomic_double __local *object, | ||
| 4841 | + memory_order order, memory_scope scope); | ||
| 4842 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4843 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4844 | +long __ovld atomic_load_explicit(volatile atomic_long __global *object, | ||
| 4845 | + memory_order order); | ||
| 4846 | +long __ovld atomic_load_explicit(volatile atomic_long __local *object, | ||
| 4847 | + memory_order order); | ||
| 4848 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong __global *object, | ||
| 4849 | + memory_order order); | ||
| 4850 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong __local *object, | ||
| 4851 | + memory_order order); | ||
| 4852 | +#endif // __opencl_c_atomic_scope_device | ||
| 4853 | +long __ovld atomic_load_explicit(volatile atomic_long __global *object, | ||
| 4854 | + memory_order order, memory_scope scope); | ||
| 4855 | +long __ovld atomic_load_explicit(volatile atomic_long __local *object, | ||
| 4856 | + memory_order order, memory_scope scope); | ||
| 4857 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong __global *object, | ||
| 4858 | + memory_order order, memory_scope scope); | ||
| 4859 | +ulong __ovld atomic_load_explicit(volatile atomic_ulong __local *object, | ||
| 4860 | + memory_order order, memory_scope scope); | ||
| 4861 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4862 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4863 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4864 | |||
| 4865 | // atomic_exchange() | ||
| 4866 | - | ||
| 4867 | +#ifdef __opencl_c_generic_address_space | ||
| 4868 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4869 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4870 | int __ovld atomic_exchange(volatile atomic_int *object, int desired); | ||
| 4871 | -int __ovld atomic_exchange_explicit(volatile atomic_int *object, int desired, memory_order order); | ||
| 4872 | -int __ovld atomic_exchange_explicit(volatile atomic_int *object, int desired, memory_order order, memory_scope scope); | ||
| 4873 | uint __ovld atomic_exchange(volatile atomic_uint *object, uint desired); | ||
| 4874 | -uint __ovld atomic_exchange_explicit(volatile atomic_uint *object, uint desired, memory_order order); | ||
| 4875 | -uint __ovld atomic_exchange_explicit(volatile atomic_uint *object, uint desired, memory_order order, memory_scope scope); | ||
| 4876 | float __ovld atomic_exchange(volatile atomic_float *object, float desired); | ||
| 4877 | -float __ovld atomic_exchange_explicit(volatile atomic_float *object, float desired, memory_order order); | ||
| 4878 | -float __ovld atomic_exchange_explicit(volatile atomic_float *object, float desired, memory_order order, memory_scope scope); | ||
| 4879 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4880 | -#ifdef cl_khr_fp64 | ||
| 4881 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4882 | double __ovld atomic_exchange(volatile atomic_double *object, double desired); | ||
| 4883 | -double __ovld atomic_exchange_explicit(volatile atomic_double *object, double desired, memory_order order); | ||
| 4884 | -double __ovld atomic_exchange_explicit(volatile atomic_double *object, double desired, memory_order order, memory_scope scope); | ||
| 4885 | -#endif //cl_khr_fp64 | ||
| 4886 | +#endif | ||
| 4887 | long __ovld atomic_exchange(volatile atomic_long *object, long desired); | ||
| 4888 | -long __ovld atomic_exchange_explicit(volatile atomic_long *object, long desired, memory_order order); | ||
| 4889 | -long __ovld atomic_exchange_explicit(volatile atomic_long *object, long desired, memory_order order, memory_scope scope); | ||
| 4890 | ulong __ovld atomic_exchange(volatile atomic_ulong *object, ulong desired); | ||
| 4891 | -ulong __ovld atomic_exchange_explicit(volatile atomic_ulong *object, ulong desired, memory_order order); | ||
| 4892 | -ulong __ovld atomic_exchange_explicit(volatile atomic_ulong *object, ulong desired, memory_order order, memory_scope scope); | ||
| 4893 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4894 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4895 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4896 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4897 | +#endif // __opencl_c_generic_address_space | ||
| 4898 | + | ||
| 4899 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4900 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 4901 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 4902 | +int __ovld atomic_exchange(volatile atomic_int __global *object, int desired); | ||
| 4903 | +int __ovld atomic_exchange(volatile atomic_int __local *object, int desired); | ||
| 4904 | +uint __ovld atomic_exchange(volatile atomic_uint __global *object, | ||
| 4905 | + uint desired); | ||
| 4906 | +uint __ovld atomic_exchange(volatile atomic_uint __local *object, uint desired); | ||
| 4907 | +float __ovld atomic_exchange(volatile atomic_float __global *object, | ||
| 4908 | + float desired); | ||
| 4909 | +float __ovld atomic_exchange(volatile atomic_float __local *object, | ||
| 4910 | + float desired); | ||
| 4911 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4912 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4913 | +double __ovld atomic_exchange(volatile atomic_double __global *object, | ||
| 4914 | + double desired); | ||
| 4915 | +double __ovld atomic_exchange(volatile atomic_double __local *object, | ||
| 4916 | + double desired); | ||
| 4917 | #endif | ||
| 4918 | +long __ovld atomic_exchange(volatile atomic_long __global *object, | ||
| 4919 | + long desired); | ||
| 4920 | +long __ovld atomic_exchange(volatile atomic_long __local *object, long desired); | ||
| 4921 | +ulong __ovld atomic_exchange(volatile atomic_ulong __global *object, | ||
| 4922 | + ulong desired); | ||
| 4923 | +ulong __ovld atomic_exchange(volatile atomic_ulong __local *object, | ||
| 4924 | + ulong desired); | ||
| 4925 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4926 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4927 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 4928 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 4929 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4930 | + | ||
| 4931 | +#ifdef __opencl_c_generic_address_space | ||
| 4932 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4933 | +int __ovld atomic_exchange_explicit(volatile atomic_int *object, int desired, | ||
| 4934 | + memory_order order); | ||
| 4935 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint *object, uint desired, | ||
| 4936 | + memory_order order); | ||
| 4937 | +float __ovld atomic_exchange_explicit(volatile atomic_float *object, | ||
| 4938 | + float desired, memory_order order); | ||
| 4939 | +#endif // __opencl_c_atomic_scope_device | ||
| 4940 | +int __ovld atomic_exchange_explicit(volatile atomic_int *object, int desired, | ||
| 4941 | + memory_order order, memory_scope scope); | ||
| 4942 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint *object, uint desired, | ||
| 4943 | + memory_order order, memory_scope scope); | ||
| 4944 | +float __ovld atomic_exchange_explicit(volatile atomic_float *object, | ||
| 4945 | + float desired, memory_order order, | ||
| 4946 | + memory_scope scope); | ||
| 4947 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 4948 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4949 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4950 | +double __ovld atomic_exchange_explicit(volatile atomic_double *object, | ||
| 4951 | + double desired, memory_order order); | ||
| 4952 | +#endif // __opencl_c_atomic_scope_device | ||
| 4953 | +double __ovld atomic_exchange_explicit(volatile atomic_double *object, | ||
| 4954 | + double desired, memory_order order, | ||
| 4955 | + memory_scope scope); | ||
| 4956 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 4957 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4958 | +long __ovld atomic_exchange_explicit(volatile atomic_long *object, long desired, | ||
| 4959 | + memory_order order); | ||
| 4960 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong *object, | ||
| 4961 | + ulong desired, memory_order order); | ||
| 4962 | +#endif // __opencl_c_atomic_scope_device | ||
| 4963 | +long __ovld atomic_exchange_explicit(volatile atomic_long *object, long desired, | ||
| 4964 | + memory_order order, memory_scope scope); | ||
| 4965 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong *object, | ||
| 4966 | + ulong desired, memory_order order, | ||
| 4967 | + memory_scope scope); | ||
| 4968 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 4969 | + // defined(cl_khr_int64_extended_atomics) | ||
| 4970 | +#endif // __opencl_c_generic_address_space | ||
| 4971 | + | ||
| 4972 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 4973 | +#ifdef __opencl_c_atomic_scope_device | ||
| 4974 | +int __ovld atomic_exchange_explicit(volatile atomic_int __global *object, | ||
| 4975 | + int desired, memory_order order); | ||
| 4976 | +int __ovld atomic_exchange_explicit(volatile atomic_int __local *object, | ||
| 4977 | + int desired, memory_order order); | ||
| 4978 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint __global *object, | ||
| 4979 | + uint desired, memory_order order); | ||
| 4980 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint __local *object, | ||
| 4981 | + uint desired, memory_order order); | ||
| 4982 | +float __ovld atomic_exchange_explicit(volatile atomic_float __global *object, | ||
| 4983 | + float desired, memory_order order); | ||
| 4984 | +float __ovld atomic_exchange_explicit(volatile atomic_float __local *object, | ||
| 4985 | + float desired, memory_order order); | ||
| 4986 | +#endif // __opencl_c_atomic_scope_device | ||
| 4987 | +int __ovld atomic_exchange_explicit(volatile atomic_int __global *object, | ||
| 4988 | + int desired, memory_order order, | ||
| 4989 | + memory_scope scope); | ||
| 4990 | +int __ovld atomic_exchange_explicit(volatile atomic_int __local *object, | ||
| 4991 | + int desired, memory_order order, | ||
| 4992 | + memory_scope scope); | ||
| 4993 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint __global *object, | ||
| 4994 | + uint desired, memory_order order, | ||
| 4995 | + memory_scope scope); | ||
| 4996 | +uint __ovld atomic_exchange_explicit(volatile atomic_uint __local *object, | ||
| 4997 | + uint desired, memory_order order, | ||
| 4998 | + memory_scope scope); | ||
| 4999 | +float __ovld atomic_exchange_explicit(volatile atomic_float __global *object, | ||
| 5000 | + float desired, memory_order order, | ||
| 5001 | + memory_scope scope); | ||
| 5002 | +float __ovld atomic_exchange_explicit(volatile atomic_float __local *object, | ||
| 5003 | + float desired, memory_order order, | ||
| 5004 | + memory_scope scope); | ||
| 5005 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5006 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5007 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5008 | +double __ovld atomic_exchange_explicit(volatile atomic_double __global *object, | ||
| 5009 | + double desired, memory_order order); | ||
| 5010 | +double __ovld atomic_exchange_explicit(volatile atomic_double __local *object, | ||
| 5011 | + double desired, memory_order order); | ||
| 5012 | +#endif // __opencl_c_atomic_scope_device | ||
| 5013 | +double __ovld atomic_exchange_explicit(volatile atomic_double __global *object, | ||
| 5014 | + double desired, memory_order order, | ||
| 5015 | + memory_scope scope); | ||
| 5016 | +double __ovld atomic_exchange_explicit(volatile atomic_double __local *object, | ||
| 5017 | + double desired, memory_order order, | ||
| 5018 | + memory_scope scope); | ||
| 5019 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5020 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5021 | +long __ovld atomic_exchange_explicit(volatile atomic_long __global *object, | ||
| 5022 | + long desired, memory_order order); | ||
| 5023 | +long __ovld atomic_exchange_explicit(volatile atomic_long __local *object, | ||
| 5024 | + long desired, memory_order order); | ||
| 5025 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong __global *object, | ||
| 5026 | + ulong desired, memory_order order); | ||
| 5027 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong __local *object, | ||
| 5028 | + ulong desired, memory_order order); | ||
| 5029 | +#endif // __opencl_c_atomic_scope_device | ||
| 5030 | +long __ovld atomic_exchange_explicit(volatile atomic_long __global *object, | ||
| 5031 | + long desired, memory_order order, | ||
| 5032 | + memory_scope scope); | ||
| 5033 | +long __ovld atomic_exchange_explicit(volatile atomic_long __local *object, | ||
| 5034 | + long desired, memory_order order, | ||
| 5035 | + memory_scope scope); | ||
| 5036 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong __global *object, | ||
| 5037 | + ulong desired, memory_order order, | ||
| 5038 | + memory_scope scope); | ||
| 5039 | +ulong __ovld atomic_exchange_explicit(volatile atomic_ulong __local *object, | ||
| 5040 | + ulong desired, memory_order order, | ||
| 5041 | + memory_scope scope); | ||
| 5042 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5043 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5044 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5045 | |||
| 5046 | // atomic_compare_exchange_strong() and atomic_compare_exchange_weak() | ||
| 5047 | - | ||
| 5048 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_int *object, int *expected, int desired); | ||
| 5049 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_int *object, int *expected, | ||
| 5050 | - int desired, memory_order success, memory_order failure); | ||
| 5051 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_int *object, int *expected, | ||
| 5052 | - int desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5053 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_uint *object, uint *expected, uint desired); | ||
| 5054 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_uint *object, uint *expected, | ||
| 5055 | - uint desired, memory_order success, memory_order failure); | ||
| 5056 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_uint *object, uint *expected, | ||
| 5057 | - uint desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5058 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_int *object, int *expected, int desired); | ||
| 5059 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_int *object, int *expected, | ||
| 5060 | - int desired, memory_order success, memory_order failure); | ||
| 5061 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_int *object, int *expected, | ||
| 5062 | - int desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5063 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_uint *object, uint *expected, uint desired); | ||
| 5064 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_uint *object, uint *expected, | ||
| 5065 | - uint desired, memory_order success, memory_order failure); | ||
| 5066 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_uint *object, uint *expected, | ||
| 5067 | - uint desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5068 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_float *object, float *expected, float desired); | ||
| 5069 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_float *object, float *expected, | ||
| 5070 | - float desired, memory_order success, memory_order failure); | ||
| 5071 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_float *object, float *expected, | ||
| 5072 | - float desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5073 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_float *object, float *expected, float desired); | ||
| 5074 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_float *object, float *expected, | ||
| 5075 | - float desired, memory_order success, memory_order failure); | ||
| 5076 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_float *object, float *expected, | ||
| 5077 | - float desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5078 | +#ifdef __opencl_c_generic_address_space | ||
| 5079 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 5080 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 5081 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int *object, | ||
| 5082 | + int *expected, int desired); | ||
| 5083 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_uint *object, | ||
| 5084 | + uint *expected, uint desired); | ||
| 5085 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int *object, | ||
| 5086 | + int *expected, int desired); | ||
| 5087 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint *object, | ||
| 5088 | + uint *expected, uint desired); | ||
| 5089 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_float *object, | ||
| 5090 | + float *expected, float desired); | ||
| 5091 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float *object, | ||
| 5092 | + float *expected, float desired); | ||
| 5093 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5094 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5095 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_double *object, | ||
| 5096 | + double *expected, double desired); | ||
| 5097 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_double *object, | ||
| 5098 | + double *expected, double desired); | ||
| 5099 | +#endif | ||
| 5100 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_long *object, | ||
| 5101 | + long *expected, long desired); | ||
| 5102 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long *object, | ||
| 5103 | + long *expected, long desired); | ||
| 5104 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_ulong *object, | ||
| 5105 | + ulong *expected, ulong desired); | ||
| 5106 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong *object, | ||
| 5107 | + ulong *expected, ulong desired); | ||
| 5108 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5109 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5110 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 5111 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 5112 | +#endif // __opencl_c_generic_address_space | ||
| 5113 | + | ||
| 5114 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5115 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 5116 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 5117 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __global *object, | ||
| 5118 | + int __global *expected, int desired); | ||
| 5119 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __local *object, | ||
| 5120 | + int __global *expected, int desired); | ||
| 5121 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __global *object, | ||
| 5122 | + int __local *expected, int desired); | ||
| 5123 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __local *object, | ||
| 5124 | + int __local *expected, int desired); | ||
| 5125 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __global *object, | ||
| 5126 | + int __private *expected, | ||
| 5127 | + int desired); | ||
| 5128 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_int __local *object, | ||
| 5129 | + int __private *expected, | ||
| 5130 | + int desired); | ||
| 5131 | +bool __ovld | ||
| 5132 | +atomic_compare_exchange_strong(volatile atomic_uint __global *object, | ||
| 5133 | + uint __global *expected, uint desired); | ||
| 5134 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_uint __local *object, | ||
| 5135 | + uint __global *expected, | ||
| 5136 | + uint desired); | ||
| 5137 | +bool __ovld | ||
| 5138 | +atomic_compare_exchange_strong(volatile atomic_uint __global *object, | ||
| 5139 | + uint __local *expected, uint desired); | ||
| 5140 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_uint __local *object, | ||
| 5141 | + uint __local *expected, | ||
| 5142 | + uint desired); | ||
| 5143 | +bool __ovld | ||
| 5144 | +atomic_compare_exchange_strong(volatile atomic_uint __global *object, | ||
| 5145 | + uint __private *expected, uint desired); | ||
| 5146 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_uint __local *object, | ||
| 5147 | + uint __private *expected, | ||
| 5148 | + uint desired); | ||
| 5149 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __global *object, | ||
| 5150 | + int __global *expected, int desired); | ||
| 5151 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __local *object, | ||
| 5152 | + int __global *expected, int desired); | ||
| 5153 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __global *object, | ||
| 5154 | + int __local *expected, int desired); | ||
| 5155 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __local *object, | ||
| 5156 | + int __local *expected, int desired); | ||
| 5157 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __global *object, | ||
| 5158 | + int __private *expected, int desired); | ||
| 5159 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_int __local *object, | ||
| 5160 | + int __private *expected, int desired); | ||
| 5161 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __global *object, | ||
| 5162 | + uint __global *expected, uint desired); | ||
| 5163 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __local *object, | ||
| 5164 | + uint __global *expected, uint desired); | ||
| 5165 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __global *object, | ||
| 5166 | + uint __local *expected, uint desired); | ||
| 5167 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __local *object, | ||
| 5168 | + uint __local *expected, uint desired); | ||
| 5169 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __global *object, | ||
| 5170 | + uint __private *expected, | ||
| 5171 | + uint desired); | ||
| 5172 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_uint __local *object, | ||
| 5173 | + uint __private *expected, | ||
| 5174 | + uint desired); | ||
| 5175 | +bool __ovld | ||
| 5176 | +atomic_compare_exchange_strong(volatile atomic_float __global *object, | ||
| 5177 | + float __global *expected, float desired); | ||
| 5178 | +bool __ovld | ||
| 5179 | +atomic_compare_exchange_strong(volatile atomic_float __local *object, | ||
| 5180 | + float __global *expected, float desired); | ||
| 5181 | +bool __ovld | ||
| 5182 | +atomic_compare_exchange_strong(volatile atomic_float __global *object, | ||
| 5183 | + float __local *expected, float desired); | ||
| 5184 | +bool __ovld | ||
| 5185 | +atomic_compare_exchange_strong(volatile atomic_float __local *object, | ||
| 5186 | + float __local *expected, float desired); | ||
| 5187 | +bool __ovld | ||
| 5188 | +atomic_compare_exchange_strong(volatile atomic_float __global *object, | ||
| 5189 | + float __private *expected, float desired); | ||
| 5190 | +bool __ovld | ||
| 5191 | +atomic_compare_exchange_strong(volatile atomic_float __local *object, | ||
| 5192 | + float __private *expected, float desired); | ||
| 5193 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __global *object, | ||
| 5194 | + float __global *expected, | ||
| 5195 | + float desired); | ||
| 5196 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __local *object, | ||
| 5197 | + float __global *expected, | ||
| 5198 | + float desired); | ||
| 5199 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __global *object, | ||
| 5200 | + float __local *expected, | ||
| 5201 | + float desired); | ||
| 5202 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __local *object, | ||
| 5203 | + float __local *expected, | ||
| 5204 | + float desired); | ||
| 5205 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __global *object, | ||
| 5206 | + float __private *expected, | ||
| 5207 | + float desired); | ||
| 5208 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_float __local *object, | ||
| 5209 | + float __private *expected, | ||
| 5210 | + float desired); | ||
| 5211 | #if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5212 | -#ifdef cl_khr_fp64 | ||
| 5213 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_double *object, double *expected, double desired); | ||
| 5214 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_double *object, double *expected, | ||
| 5215 | - double desired, memory_order success, memory_order failure); | ||
| 5216 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_double *object, double *expected, | ||
| 5217 | - double desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5218 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_double *object, double *expected, double desired); | ||
| 5219 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_double *object, double *expected, | ||
| 5220 | - double desired, memory_order success, memory_order failure); | ||
| 5221 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_double *object, double *expected, | ||
| 5222 | - double desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5223 | -#endif //cl_khr_fp64 | ||
| 5224 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_long *object, long *expected, long desired); | ||
| 5225 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_long *object, long *expected, | ||
| 5226 | - long desired, memory_order success, memory_order failure); | ||
| 5227 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_long *object, long *expected, | ||
| 5228 | - long desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5229 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_long *object, long *expected, long desired); | ||
| 5230 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_long *object, long *expected, | ||
| 5231 | - long desired, memory_order success, memory_order failure); | ||
| 5232 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_long *object, long *expected, | ||
| 5233 | - long desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5234 | -bool __ovld atomic_compare_exchange_strong(volatile atomic_ulong *object, ulong *expected, ulong desired); | ||
| 5235 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_ulong *object, ulong *expected, | ||
| 5236 | - ulong desired, memory_order success, memory_order failure); | ||
| 5237 | -bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_ulong *object, ulong *expected, | ||
| 5238 | - ulong desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5239 | -bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong *object, ulong *expected, ulong desired); | ||
| 5240 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_ulong *object, ulong *expected, | ||
| 5241 | - ulong desired, memory_order success, memory_order failure); | ||
| 5242 | -bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_ulong *object, ulong *expected, | ||
| 5243 | - ulong desired, memory_order success, memory_order failure, memory_scope scope); | ||
| 5244 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5245 | +bool __ovld | ||
| 5246 | +atomic_compare_exchange_strong(volatile atomic_double __global *object, | ||
| 5247 | + double __global *expected, double desired); | ||
| 5248 | +bool __ovld | ||
| 5249 | +atomic_compare_exchange_strong(volatile atomic_double __local *object, | ||
| 5250 | + double __global *expected, double desired); | ||
| 5251 | +bool __ovld | ||
| 5252 | +atomic_compare_exchange_strong(volatile atomic_double __global *object, | ||
| 5253 | + double __local *expected, double desired); | ||
| 5254 | +bool __ovld | ||
| 5255 | +atomic_compare_exchange_strong(volatile atomic_double __local *object, | ||
| 5256 | + double __local *expected, double desired); | ||
| 5257 | +bool __ovld | ||
| 5258 | +atomic_compare_exchange_strong(volatile atomic_double __global *object, | ||
| 5259 | + double __private *expected, double desired); | ||
| 5260 | +bool __ovld | ||
| 5261 | +atomic_compare_exchange_strong(volatile atomic_double __local *object, | ||
| 5262 | + double __private *expected, double desired); | ||
| 5263 | +bool __ovld | ||
| 5264 | +atomic_compare_exchange_weak(volatile atomic_double __global *object, | ||
| 5265 | + double __global *expected, double desired); | ||
| 5266 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_double __local *object, | ||
| 5267 | + double __global *expected, | ||
| 5268 | + double desired); | ||
| 5269 | +bool __ovld | ||
| 5270 | +atomic_compare_exchange_weak(volatile atomic_double __global *object, | ||
| 5271 | + double __local *expected, double desired); | ||
| 5272 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_double __local *object, | ||
| 5273 | + double __local *expected, | ||
| 5274 | + double desired); | ||
| 5275 | +bool __ovld | ||
| 5276 | +atomic_compare_exchange_weak(volatile atomic_double __global *object, | ||
| 5277 | + double __private *expected, double desired); | ||
| 5278 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_double __local *object, | ||
| 5279 | + double __private *expected, | ||
| 5280 | + double desired); | ||
| 5281 | #endif | ||
| 5282 | +bool __ovld | ||
| 5283 | +atomic_compare_exchange_strong(volatile atomic_long __global *object, | ||
| 5284 | + long __global *expected, long desired); | ||
| 5285 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_long __local *object, | ||
| 5286 | + long __global *expected, | ||
| 5287 | + long desired); | ||
| 5288 | +bool __ovld | ||
| 5289 | +atomic_compare_exchange_strong(volatile atomic_long __global *object, | ||
| 5290 | + long __local *expected, long desired); | ||
| 5291 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_long __local *object, | ||
| 5292 | + long __local *expected, | ||
| 5293 | + long desired); | ||
| 5294 | +bool __ovld | ||
| 5295 | +atomic_compare_exchange_strong(volatile atomic_long __global *object, | ||
| 5296 | + long __private *expected, long desired); | ||
| 5297 | +bool __ovld atomic_compare_exchange_strong(volatile atomic_long __local *object, | ||
| 5298 | + long __private *expected, | ||
| 5299 | + long desired); | ||
| 5300 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __global *object, | ||
| 5301 | + long __global *expected, long desired); | ||
| 5302 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __local *object, | ||
| 5303 | + long __global *expected, long desired); | ||
| 5304 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __global *object, | ||
| 5305 | + long __local *expected, long desired); | ||
| 5306 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __local *object, | ||
| 5307 | + long __local *expected, long desired); | ||
| 5308 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __global *object, | ||
| 5309 | + long __private *expected, | ||
| 5310 | + long desired); | ||
| 5311 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_long __local *object, | ||
| 5312 | + long __private *expected, | ||
| 5313 | + long desired); | ||
| 5314 | +bool __ovld | ||
| 5315 | +atomic_compare_exchange_strong(volatile atomic_ulong __global *object, | ||
| 5316 | + ulong __global *expected, ulong desired); | ||
| 5317 | +bool __ovld | ||
| 5318 | +atomic_compare_exchange_strong(volatile atomic_ulong __local *object, | ||
| 5319 | + ulong __global *expected, ulong desired); | ||
| 5320 | +bool __ovld | ||
| 5321 | +atomic_compare_exchange_strong(volatile atomic_ulong __global *object, | ||
| 5322 | + ulong __local *expected, ulong desired); | ||
| 5323 | +bool __ovld | ||
| 5324 | +atomic_compare_exchange_strong(volatile atomic_ulong __local *object, | ||
| 5325 | + ulong __local *expected, ulong desired); | ||
| 5326 | +bool __ovld | ||
| 5327 | +atomic_compare_exchange_strong(volatile atomic_ulong __global *object, | ||
| 5328 | + ulong __private *expected, ulong desired); | ||
| 5329 | +bool __ovld | ||
| 5330 | +atomic_compare_exchange_strong(volatile atomic_ulong __local *object, | ||
| 5331 | + ulong __private *expected, ulong desired); | ||
| 5332 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __global *object, | ||
| 5333 | + ulong __global *expected, | ||
| 5334 | + ulong desired); | ||
| 5335 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __local *object, | ||
| 5336 | + ulong __global *expected, | ||
| 5337 | + ulong desired); | ||
| 5338 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __global *object, | ||
| 5339 | + ulong __local *expected, | ||
| 5340 | + ulong desired); | ||
| 5341 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __local *object, | ||
| 5342 | + ulong __local *expected, | ||
| 5343 | + ulong desired); | ||
| 5344 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __global *object, | ||
| 5345 | + ulong __private *expected, | ||
| 5346 | + ulong desired); | ||
| 5347 | +bool __ovld atomic_compare_exchange_weak(volatile atomic_ulong __local *object, | ||
| 5348 | + ulong __private *expected, | ||
| 5349 | + ulong desired); | ||
| 5350 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5351 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5352 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 5353 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 5354 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5355 | + | ||
| 5356 | +#ifdef __opencl_c_generic_address_space | ||
| 5357 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5358 | +bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_int *object, | ||
| 5359 | + int *expected, int desired, | ||
| 5360 | + memory_order success, | ||
| 5361 | + memory_order failure); | ||
| 5362 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5363 | + volatile atomic_uint *object, uint *expected, uint desired, | ||
| 5364 | + memory_order success, memory_order failure); | ||
| 5365 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_int *object, | ||
| 5366 | + int *expected, int desired, | ||
| 5367 | + memory_order success, | ||
| 5368 | + memory_order failure); | ||
| 5369 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_uint *object, | ||
| 5370 | + uint *expected, uint desired, | ||
| 5371 | + memory_order success, | ||
| 5372 | + memory_order failure); | ||
| 5373 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5374 | + volatile atomic_float *object, float *expected, float desired, | ||
| 5375 | + memory_order success, memory_order failure); | ||
| 5376 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_float *object, | ||
| 5377 | + float *expected, | ||
| 5378 | + float desired, | ||
| 5379 | + memory_order success, | ||
| 5380 | + memory_order failure); | ||
| 5381 | +#endif // __opencl_c_atomic_scope_device | ||
| 5382 | +bool __ovld atomic_compare_exchange_strong_explicit(volatile atomic_int *object, | ||
| 5383 | + int *expected, int desired, | ||
| 5384 | + memory_order success, | ||
| 5385 | + memory_order failure, | ||
| 5386 | + memory_scope scope); | ||
| 5387 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5388 | + volatile atomic_uint *object, uint *expected, uint desired, | ||
| 5389 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5390 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_int *object, | ||
| 5391 | + int *expected, int desired, | ||
| 5392 | + memory_order success, | ||
| 5393 | + memory_order failure, | ||
| 5394 | + memory_scope scope); | ||
| 5395 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_uint *object, | ||
| 5396 | + uint *expected, uint desired, | ||
| 5397 | + memory_order success, | ||
| 5398 | + memory_order failure, | ||
| 5399 | + memory_scope scope); | ||
| 5400 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5401 | + volatile atomic_float *object, float *expected, float desired, | ||
| 5402 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5403 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5404 | + volatile atomic_float *object, float *expected, float desired, | ||
| 5405 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5406 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5407 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5408 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5409 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5410 | + volatile atomic_double *object, double *expected, double desired, | ||
| 5411 | + memory_order success, memory_order failure); | ||
| 5412 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5413 | + volatile atomic_double *object, double *expected, double desired, | ||
| 5414 | + memory_order success, memory_order failure); | ||
| 5415 | +#endif // __opencl_c_atomic_scope_device | ||
| 5416 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5417 | + volatile atomic_double *object, double *expected, double desired, | ||
| 5418 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5419 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5420 | + volatile atomic_double *object, double *expected, double desired, | ||
| 5421 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5422 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5423 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5424 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5425 | + volatile atomic_long *object, long *expected, long desired, | ||
| 5426 | + memory_order success, memory_order failure); | ||
| 5427 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_long *object, | ||
| 5428 | + long *expected, long desired, | ||
| 5429 | + memory_order success, | ||
| 5430 | + memory_order failure); | ||
| 5431 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5432 | + volatile atomic_ulong *object, ulong *expected, ulong desired, | ||
| 5433 | + memory_order success, memory_order failure); | ||
| 5434 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_ulong *object, | ||
| 5435 | + ulong *expected, | ||
| 5436 | + ulong desired, | ||
| 5437 | + memory_order success, | ||
| 5438 | + memory_order failure); | ||
| 5439 | +#endif // __opencl_c_atomic_scope_device | ||
| 5440 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5441 | + volatile atomic_long *object, long *expected, long desired, | ||
| 5442 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5443 | +bool __ovld atomic_compare_exchange_weak_explicit(volatile atomic_long *object, | ||
| 5444 | + long *expected, long desired, | ||
| 5445 | + memory_order success, | ||
| 5446 | + memory_order failure, | ||
| 5447 | + memory_scope scope); | ||
| 5448 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5449 | + volatile atomic_ulong *object, ulong *expected, ulong desired, | ||
| 5450 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5451 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5452 | + volatile atomic_ulong *object, ulong *expected, ulong desired, | ||
| 5453 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5454 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5455 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5456 | +#endif // __opencl_c_generic_address_space | ||
| 5457 | + | ||
| 5458 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5459 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5460 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5461 | + volatile atomic_int __global *object, int __global *expected, int desired, | ||
| 5462 | + memory_order success, memory_order failure); | ||
| 5463 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5464 | + volatile atomic_int __local *object, int __global *expected, int desired, | ||
| 5465 | + memory_order success, memory_order failure); | ||
| 5466 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5467 | + volatile atomic_int __global *object, int __local *expected, int desired, | ||
| 5468 | + memory_order success, memory_order failure); | ||
| 5469 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5470 | + volatile atomic_int __local *object, int __local *expected, int desired, | ||
| 5471 | + memory_order success, memory_order failure); | ||
| 5472 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5473 | + volatile atomic_int __global *object, int __private *expected, int desired, | ||
| 5474 | + memory_order success, memory_order failure); | ||
| 5475 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5476 | + volatile atomic_int __local *object, int __private *expected, int desired, | ||
| 5477 | + memory_order success, memory_order failure); | ||
| 5478 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5479 | + volatile atomic_uint __global *object, uint __global *expected, | ||
| 5480 | + uint desired, memory_order success, memory_order failure); | ||
| 5481 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5482 | + volatile atomic_uint __local *object, uint __global *expected, uint desired, | ||
| 5483 | + memory_order success, memory_order failure); | ||
| 5484 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5485 | + volatile atomic_uint __global *object, uint __local *expected, uint desired, | ||
| 5486 | + memory_order success, memory_order failure); | ||
| 5487 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5488 | + volatile atomic_uint __local *object, uint __local *expected, uint desired, | ||
| 5489 | + memory_order success, memory_order failure); | ||
| 5490 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5491 | + volatile atomic_uint __global *object, uint __private *expected, | ||
| 5492 | + uint desired, memory_order success, memory_order failure); | ||
| 5493 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5494 | + volatile atomic_uint __local *object, uint __private *expected, | ||
| 5495 | + uint desired, memory_order success, memory_order failure); | ||
| 5496 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5497 | + volatile atomic_int __global *object, int __global *expected, int desired, | ||
| 5498 | + memory_order success, memory_order failure); | ||
| 5499 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5500 | + volatile atomic_int __local *object, int __global *expected, int desired, | ||
| 5501 | + memory_order success, memory_order failure); | ||
| 5502 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5503 | + volatile atomic_int __global *object, int __local *expected, int desired, | ||
| 5504 | + memory_order success, memory_order failure); | ||
| 5505 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5506 | + volatile atomic_int __local *object, int __local *expected, int desired, | ||
| 5507 | + memory_order success, memory_order failure); | ||
| 5508 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5509 | + volatile atomic_int __global *object, int __private *expected, int desired, | ||
| 5510 | + memory_order success, memory_order failure); | ||
| 5511 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5512 | + volatile atomic_int __local *object, int __private *expected, int desired, | ||
| 5513 | + memory_order success, memory_order failure); | ||
| 5514 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5515 | + volatile atomic_uint __global *object, uint __global *expected, | ||
| 5516 | + uint desired, memory_order success, memory_order failure); | ||
| 5517 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5518 | + volatile atomic_uint __local *object, uint __global *expected, uint desired, | ||
| 5519 | + memory_order success, memory_order failure); | ||
| 5520 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5521 | + volatile atomic_uint __global *object, uint __local *expected, uint desired, | ||
| 5522 | + memory_order success, memory_order failure); | ||
| 5523 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5524 | + volatile atomic_uint __local *object, uint __local *expected, uint desired, | ||
| 5525 | + memory_order success, memory_order failure); | ||
| 5526 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5527 | + volatile atomic_uint __global *object, uint __private *expected, | ||
| 5528 | + uint desired, memory_order success, memory_order failure); | ||
| 5529 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5530 | + volatile atomic_uint __local *object, uint __private *expected, | ||
| 5531 | + uint desired, memory_order success, memory_order failure); | ||
| 5532 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5533 | + volatile atomic_float __global *object, float __global *expected, | ||
| 5534 | + float desired, memory_order success, memory_order failure); | ||
| 5535 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5536 | + volatile atomic_float __local *object, float __global *expected, | ||
| 5537 | + float desired, memory_order success, memory_order failure); | ||
| 5538 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5539 | + volatile atomic_float __global *object, float __local *expected, | ||
| 5540 | + float desired, memory_order success, memory_order failure); | ||
| 5541 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5542 | + volatile atomic_float __local *object, float __local *expected, | ||
| 5543 | + float desired, memory_order success, memory_order failure); | ||
| 5544 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5545 | + volatile atomic_float __global *object, float __private *expected, | ||
| 5546 | + float desired, memory_order success, memory_order failure); | ||
| 5547 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5548 | + volatile atomic_float __local *object, float __private *expected, | ||
| 5549 | + float desired, memory_order success, memory_order failure); | ||
| 5550 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5551 | + volatile atomic_float __global *object, float __global *expected, | ||
| 5552 | + float desired, memory_order success, memory_order failure); | ||
| 5553 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5554 | + volatile atomic_float __local *object, float __global *expected, | ||
| 5555 | + float desired, memory_order success, memory_order failure); | ||
| 5556 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5557 | + volatile atomic_float __global *object, float __local *expected, | ||
| 5558 | + float desired, memory_order success, memory_order failure); | ||
| 5559 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5560 | + volatile atomic_float __local *object, float __local *expected, | ||
| 5561 | + float desired, memory_order success, memory_order failure); | ||
| 5562 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5563 | + volatile atomic_float __global *object, float __private *expected, | ||
| 5564 | + float desired, memory_order success, memory_order failure); | ||
| 5565 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5566 | + volatile atomic_float __local *object, float __private *expected, | ||
| 5567 | + float desired, memory_order success, memory_order failure); | ||
| 5568 | +#endif // __opencl_c_atomic_scope_device | ||
| 5569 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5570 | + volatile atomic_int __global *object, int __global *expected, int desired, | ||
| 5571 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5572 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5573 | + volatile atomic_int __local *object, int __global *expected, int desired, | ||
| 5574 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5575 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5576 | + volatile atomic_int __global *object, int __local *expected, int desired, | ||
| 5577 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5578 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5579 | + volatile atomic_int __local *object, int __local *expected, int desired, | ||
| 5580 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5581 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5582 | + volatile atomic_int __global *object, int __private *expected, int desired, | ||
| 5583 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5584 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5585 | + volatile atomic_int __local *object, int __private *expected, int desired, | ||
| 5586 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5587 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5588 | + volatile atomic_uint __global *object, uint __global *expected, | ||
| 5589 | + uint desired, memory_order success, memory_order failure, | ||
| 5590 | + memory_scope scope); | ||
| 5591 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5592 | + volatile atomic_uint __local *object, uint __global *expected, uint desired, | ||
| 5593 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5594 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5595 | + volatile atomic_uint __global *object, uint __local *expected, uint desired, | ||
| 5596 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5597 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5598 | + volatile atomic_uint __local *object, uint __local *expected, uint desired, | ||
| 5599 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5600 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5601 | + volatile atomic_uint __global *object, uint __private *expected, | ||
| 5602 | + uint desired, memory_order success, memory_order failure, | ||
| 5603 | + memory_scope scope); | ||
| 5604 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5605 | + volatile atomic_uint __local *object, uint __private *expected, | ||
| 5606 | + uint desired, memory_order success, memory_order failure, | ||
| 5607 | + memory_scope scope); | ||
| 5608 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5609 | + volatile atomic_int __global *object, int __global *expected, int desired, | ||
| 5610 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5611 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5612 | + volatile atomic_int __local *object, int __global *expected, int desired, | ||
| 5613 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5614 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5615 | + volatile atomic_int __global *object, int __local *expected, int desired, | ||
| 5616 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5617 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5618 | + volatile atomic_int __local *object, int __local *expected, int desired, | ||
| 5619 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5620 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5621 | + volatile atomic_int __global *object, int __private *expected, int desired, | ||
| 5622 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5623 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5624 | + volatile atomic_int __local *object, int __private *expected, int desired, | ||
| 5625 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5626 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5627 | + volatile atomic_uint __global *object, uint __global *expected, | ||
| 5628 | + uint desired, memory_order success, memory_order failure, | ||
| 5629 | + memory_scope scope); | ||
| 5630 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5631 | + volatile atomic_uint __local *object, uint __global *expected, uint desired, | ||
| 5632 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5633 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5634 | + volatile atomic_uint __global *object, uint __local *expected, uint desired, | ||
| 5635 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5636 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5637 | + volatile atomic_uint __local *object, uint __local *expected, uint desired, | ||
| 5638 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5639 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5640 | + volatile atomic_uint __global *object, uint __private *expected, | ||
| 5641 | + uint desired, memory_order success, memory_order failure, | ||
| 5642 | + memory_scope scope); | ||
| 5643 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5644 | + volatile atomic_uint __local *object, uint __private *expected, | ||
| 5645 | + uint desired, memory_order success, memory_order failure, | ||
| 5646 | + memory_scope scope); | ||
| 5647 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5648 | + volatile atomic_float __global *object, float __global *expected, | ||
| 5649 | + float desired, memory_order success, memory_order failure, | ||
| 5650 | + memory_scope scope); | ||
| 5651 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5652 | + volatile atomic_float __local *object, float __global *expected, | ||
| 5653 | + float desired, memory_order success, memory_order failure, | ||
| 5654 | + memory_scope scope); | ||
| 5655 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5656 | + volatile atomic_float __global *object, float __local *expected, | ||
| 5657 | + float desired, memory_order success, memory_order failure, | ||
| 5658 | + memory_scope scope); | ||
| 5659 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5660 | + volatile atomic_float __local *object, float __local *expected, | ||
| 5661 | + float desired, memory_order success, memory_order failure, | ||
| 5662 | + memory_scope scope); | ||
| 5663 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5664 | + volatile atomic_float __global *object, float __private *expected, | ||
| 5665 | + float desired, memory_order success, memory_order failure, | ||
| 5666 | + memory_scope scope); | ||
| 5667 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5668 | + volatile atomic_float __local *object, float __private *expected, | ||
| 5669 | + float desired, memory_order success, memory_order failure, | ||
| 5670 | + memory_scope scope); | ||
| 5671 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5672 | + volatile atomic_float __global *object, float __global *expected, | ||
| 5673 | + float desired, memory_order success, memory_order failure, | ||
| 5674 | + memory_scope scope); | ||
| 5675 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5676 | + volatile atomic_float __local *object, float __global *expected, | ||
| 5677 | + float desired, memory_order success, memory_order failure, | ||
| 5678 | + memory_scope scope); | ||
| 5679 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5680 | + volatile atomic_float __global *object, float __local *expected, | ||
| 5681 | + float desired, memory_order success, memory_order failure, | ||
| 5682 | + memory_scope scope); | ||
| 5683 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5684 | + volatile atomic_float __local *object, float __local *expected, | ||
| 5685 | + float desired, memory_order success, memory_order failure, | ||
| 5686 | + memory_scope scope); | ||
| 5687 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5688 | + volatile atomic_float __global *object, float __private *expected, | ||
| 5689 | + float desired, memory_order success, memory_order failure, | ||
| 5690 | + memory_scope scope); | ||
| 5691 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5692 | + volatile atomic_float __local *object, float __private *expected, | ||
| 5693 | + float desired, memory_order success, memory_order failure, | ||
| 5694 | + memory_scope scope); | ||
| 5695 | +#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics) | ||
| 5696 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5697 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5698 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5699 | + volatile atomic_double __global *object, double __global *expected, | ||
| 5700 | + double desired, memory_order success, memory_order failure); | ||
| 5701 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5702 | + volatile atomic_double __local *object, double __global *expected, | ||
| 5703 | + double desired, memory_order success, memory_order failure); | ||
| 5704 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5705 | + volatile atomic_double __global *object, double __local *expected, | ||
| 5706 | + double desired, memory_order success, memory_order failure); | ||
| 5707 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5708 | + volatile atomic_double __local *object, double __local *expected, | ||
| 5709 | + double desired, memory_order success, memory_order failure); | ||
| 5710 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5711 | + volatile atomic_double __global *object, double __private *expected, | ||
| 5712 | + double desired, memory_order success, memory_order failure); | ||
| 5713 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5714 | + volatile atomic_double __local *object, double __private *expected, | ||
| 5715 | + double desired, memory_order success, memory_order failure); | ||
| 5716 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5717 | + volatile atomic_double __global *object, double __global *expected, | ||
| 5718 | + double desired, memory_order success, memory_order failure); | ||
| 5719 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5720 | + volatile atomic_double __local *object, double __global *expected, | ||
| 5721 | + double desired, memory_order success, memory_order failure); | ||
| 5722 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5723 | + volatile atomic_double __global *object, double __local *expected, | ||
| 5724 | + double desired, memory_order success, memory_order failure); | ||
| 5725 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5726 | + volatile atomic_double __local *object, double __local *expected, | ||
| 5727 | + double desired, memory_order success, memory_order failure); | ||
| 5728 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5729 | + volatile atomic_double __global *object, double __private *expected, | ||
| 5730 | + double desired, memory_order success, memory_order failure); | ||
| 5731 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5732 | + volatile atomic_double __local *object, double __private *expected, | ||
| 5733 | + double desired, memory_order success, memory_order failure); | ||
| 5734 | +#endif // __opencl_c_atomic_scope_device | ||
| 5735 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5736 | + volatile atomic_double __global *object, double __global *expected, | ||
| 5737 | + double desired, memory_order success, memory_order failure, | ||
| 5738 | + memory_scope scope); | ||
| 5739 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5740 | + volatile atomic_double __local *object, double __global *expected, | ||
| 5741 | + double desired, memory_order success, memory_order failure, | ||
| 5742 | + memory_scope scope); | ||
| 5743 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5744 | + volatile atomic_double __global *object, double __local *expected, | ||
| 5745 | + double desired, memory_order success, memory_order failure, | ||
| 5746 | + memory_scope scope); | ||
| 5747 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5748 | + volatile atomic_double __local *object, double __local *expected, | ||
| 5749 | + double desired, memory_order success, memory_order failure, | ||
| 5750 | + memory_scope scope); | ||
| 5751 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5752 | + volatile atomic_double __global *object, double __private *expected, | ||
| 5753 | + double desired, memory_order success, memory_order failure, | ||
| 5754 | + memory_scope scope); | ||
| 5755 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5756 | + volatile atomic_double __local *object, double __private *expected, | ||
| 5757 | + double desired, memory_order success, memory_order failure, | ||
| 5758 | + memory_scope scope); | ||
| 5759 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5760 | + volatile atomic_double __global *object, double __global *expected, | ||
| 5761 | + double desired, memory_order success, memory_order failure, | ||
| 5762 | + memory_scope scope); | ||
| 5763 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5764 | + volatile atomic_double __local *object, double __global *expected, | ||
| 5765 | + double desired, memory_order success, memory_order failure, | ||
| 5766 | + memory_scope scope); | ||
| 5767 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5768 | + volatile atomic_double __global *object, double __local *expected, | ||
| 5769 | + double desired, memory_order success, memory_order failure, | ||
| 5770 | + memory_scope scope); | ||
| 5771 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5772 | + volatile atomic_double __local *object, double __local *expected, | ||
| 5773 | + double desired, memory_order success, memory_order failure, | ||
| 5774 | + memory_scope scope); | ||
| 5775 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5776 | + volatile atomic_double __global *object, double __private *expected, | ||
| 5777 | + double desired, memory_order success, memory_order failure, | ||
| 5778 | + memory_scope scope); | ||
| 5779 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5780 | + volatile atomic_double __local *object, double __private *expected, | ||
| 5781 | + double desired, memory_order success, memory_order failure, | ||
| 5782 | + memory_scope scope); | ||
| 5783 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 5784 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5785 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5786 | + volatile atomic_long __global *object, long __global *expected, | ||
| 5787 | + long desired, memory_order success, memory_order failure); | ||
| 5788 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5789 | + volatile atomic_long __local *object, long __global *expected, long desired, | ||
| 5790 | + memory_order success, memory_order failure); | ||
| 5791 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5792 | + volatile atomic_long __global *object, long __local *expected, long desired, | ||
| 5793 | + memory_order success, memory_order failure); | ||
| 5794 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5795 | + volatile atomic_long __local *object, long __local *expected, long desired, | ||
| 5796 | + memory_order success, memory_order failure); | ||
| 5797 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5798 | + volatile atomic_long __global *object, long __private *expected, | ||
| 5799 | + long desired, memory_order success, memory_order failure); | ||
| 5800 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5801 | + volatile atomic_long __local *object, long __private *expected, | ||
| 5802 | + long desired, memory_order success, memory_order failure); | ||
| 5803 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5804 | + volatile atomic_long __global *object, long __global *expected, | ||
| 5805 | + long desired, memory_order success, memory_order failure); | ||
| 5806 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5807 | + volatile atomic_long __local *object, long __global *expected, long desired, | ||
| 5808 | + memory_order success, memory_order failure); | ||
| 5809 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5810 | + volatile atomic_long __global *object, long __local *expected, long desired, | ||
| 5811 | + memory_order success, memory_order failure); | ||
| 5812 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5813 | + volatile atomic_long __local *object, long __local *expected, long desired, | ||
| 5814 | + memory_order success, memory_order failure); | ||
| 5815 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5816 | + volatile atomic_long __global *object, long __private *expected, | ||
| 5817 | + long desired, memory_order success, memory_order failure); | ||
| 5818 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5819 | + volatile atomic_long __local *object, long __private *expected, | ||
| 5820 | + long desired, memory_order success, memory_order failure); | ||
| 5821 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5822 | + volatile atomic_ulong __global *object, ulong __global *expected, | ||
| 5823 | + ulong desired, memory_order success, memory_order failure); | ||
| 5824 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5825 | + volatile atomic_ulong __local *object, ulong __global *expected, | ||
| 5826 | + ulong desired, memory_order success, memory_order failure); | ||
| 5827 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5828 | + volatile atomic_ulong __global *object, ulong __local *expected, | ||
| 5829 | + ulong desired, memory_order success, memory_order failure); | ||
| 5830 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5831 | + volatile atomic_ulong __local *object, ulong __local *expected, | ||
| 5832 | + ulong desired, memory_order success, memory_order failure); | ||
| 5833 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5834 | + volatile atomic_ulong __global *object, ulong __private *expected, | ||
| 5835 | + ulong desired, memory_order success, memory_order failure); | ||
| 5836 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5837 | + volatile atomic_ulong __local *object, ulong __private *expected, | ||
| 5838 | + ulong desired, memory_order success, memory_order failure); | ||
| 5839 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5840 | + volatile atomic_ulong __global *object, ulong __global *expected, | ||
| 5841 | + ulong desired, memory_order success, memory_order failure); | ||
| 5842 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5843 | + volatile atomic_ulong __local *object, ulong __global *expected, | ||
| 5844 | + ulong desired, memory_order success, memory_order failure); | ||
| 5845 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5846 | + volatile atomic_ulong __global *object, ulong __local *expected, | ||
| 5847 | + ulong desired, memory_order success, memory_order failure); | ||
| 5848 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5849 | + volatile atomic_ulong __local *object, ulong __local *expected, | ||
| 5850 | + ulong desired, memory_order success, memory_order failure); | ||
| 5851 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5852 | + volatile atomic_ulong __global *object, ulong __private *expected, | ||
| 5853 | + ulong desired, memory_order success, memory_order failure); | ||
| 5854 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5855 | + volatile atomic_ulong __local *object, ulong __private *expected, | ||
| 5856 | + ulong desired, memory_order success, memory_order failure); | ||
| 5857 | +#endif // __opencl_c_atomic_scope_device | ||
| 5858 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5859 | + volatile atomic_long __global *object, long __global *expected, | ||
| 5860 | + long desired, memory_order success, memory_order failure, | ||
| 5861 | + memory_scope scope); | ||
| 5862 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5863 | + volatile atomic_long __local *object, long __global *expected, long desired, | ||
| 5864 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5865 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5866 | + volatile atomic_long __global *object, long __local *expected, long desired, | ||
| 5867 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5868 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5869 | + volatile atomic_long __local *object, long __local *expected, long desired, | ||
| 5870 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5871 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5872 | + volatile atomic_long __global *object, long __private *expected, | ||
| 5873 | + long desired, memory_order success, memory_order failure, | ||
| 5874 | + memory_scope scope); | ||
| 5875 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5876 | + volatile atomic_long __local *object, long __private *expected, | ||
| 5877 | + long desired, memory_order success, memory_order failure, | ||
| 5878 | + memory_scope scope); | ||
| 5879 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5880 | + volatile atomic_long __global *object, long __global *expected, | ||
| 5881 | + long desired, memory_order success, memory_order failure, | ||
| 5882 | + memory_scope scope); | ||
| 5883 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5884 | + volatile atomic_long __local *object, long __global *expected, long desired, | ||
| 5885 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5886 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5887 | + volatile atomic_long __global *object, long __local *expected, long desired, | ||
| 5888 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5889 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5890 | + volatile atomic_long __local *object, long __local *expected, long desired, | ||
| 5891 | + memory_order success, memory_order failure, memory_scope scope); | ||
| 5892 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5893 | + volatile atomic_long __global *object, long __private *expected, | ||
| 5894 | + long desired, memory_order success, memory_order failure, | ||
| 5895 | + memory_scope scope); | ||
| 5896 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5897 | + volatile atomic_long __local *object, long __private *expected, | ||
| 5898 | + long desired, memory_order success, memory_order failure, | ||
| 5899 | + memory_scope scope); | ||
| 5900 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5901 | + volatile atomic_ulong __global *object, ulong __global *expected, | ||
| 5902 | + ulong desired, memory_order success, memory_order failure, | ||
| 5903 | + memory_scope scope); | ||
| 5904 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5905 | + volatile atomic_ulong __local *object, ulong __global *expected, | ||
| 5906 | + ulong desired, memory_order success, memory_order failure, | ||
| 5907 | + memory_scope scope); | ||
| 5908 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5909 | + volatile atomic_ulong __global *object, ulong __local *expected, | ||
| 5910 | + ulong desired, memory_order success, memory_order failure, | ||
| 5911 | + memory_scope scope); | ||
| 5912 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5913 | + volatile atomic_ulong __local *object, ulong __local *expected, | ||
| 5914 | + ulong desired, memory_order success, memory_order failure, | ||
| 5915 | + memory_scope scope); | ||
| 5916 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5917 | + volatile atomic_ulong __global *object, ulong __private *expected, | ||
| 5918 | + ulong desired, memory_order success, memory_order failure, | ||
| 5919 | + memory_scope scope); | ||
| 5920 | +bool __ovld atomic_compare_exchange_strong_explicit( | ||
| 5921 | + volatile atomic_ulong __local *object, ulong __private *expected, | ||
| 5922 | + ulong desired, memory_order success, memory_order failure, | ||
| 5923 | + memory_scope scope); | ||
| 5924 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5925 | + volatile atomic_ulong __global *object, ulong __global *expected, | ||
| 5926 | + ulong desired, memory_order success, memory_order failure, | ||
| 5927 | + memory_scope scope); | ||
| 5928 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5929 | + volatile atomic_ulong __local *object, ulong __global *expected, | ||
| 5930 | + ulong desired, memory_order success, memory_order failure, | ||
| 5931 | + memory_scope scope); | ||
| 5932 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5933 | + volatile atomic_ulong __global *object, ulong __local *expected, | ||
| 5934 | + ulong desired, memory_order success, memory_order failure, | ||
| 5935 | + memory_scope scope); | ||
| 5936 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5937 | + volatile atomic_ulong __local *object, ulong __local *expected, | ||
| 5938 | + ulong desired, memory_order success, memory_order failure, | ||
| 5939 | + memory_scope scope); | ||
| 5940 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5941 | + volatile atomic_ulong __global *object, ulong __private *expected, | ||
| 5942 | + ulong desired, memory_order success, memory_order failure, | ||
| 5943 | + memory_scope scope); | ||
| 5944 | +bool __ovld atomic_compare_exchange_weak_explicit( | ||
| 5945 | + volatile atomic_ulong __local *object, ulong __private *expected, | ||
| 5946 | + ulong desired, memory_order success, memory_order failure, | ||
| 5947 | + memory_scope scope); | ||
| 5948 | +#endif // defined(cl_khr_int64_base_atomics) && | ||
| 5949 | + // defined(cl_khr_int64_extended_atomics) | ||
| 5950 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5951 | |||
| 5952 | // atomic_flag_test_and_set() and atomic_flag_clear() | ||
| 5953 | - | ||
| 5954 | +#if defined(__opencl_c_atomic_scope_device) && \ | ||
| 5955 | + defined(__opencl_c_atomic_order_seq_cst) | ||
| 5956 | +#ifdef __opencl_c_generic_address_space | ||
| 5957 | bool __ovld atomic_flag_test_and_set(volatile atomic_flag *object); | ||
| 5958 | -bool __ovld atomic_flag_test_and_set_explicit(volatile atomic_flag *object, memory_order order); | ||
| 5959 | -bool __ovld atomic_flag_test_and_set_explicit(volatile atomic_flag *object, memory_order order, memory_scope scope); | ||
| 5960 | void __ovld atomic_flag_clear(volatile atomic_flag *object); | ||
| 5961 | -void __ovld atomic_flag_clear_explicit(volatile atomic_flag *object, memory_order order); | ||
| 5962 | -void __ovld atomic_flag_clear_explicit(volatile atomic_flag *object, memory_order order, memory_scope scope); | ||
| 5963 | +#endif // __opencl_c_generic_address_space | ||
| 5964 | + | ||
| 5965 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5966 | +bool __ovld atomic_flag_test_and_set(volatile atomic_flag __global *object); | ||
| 5967 | +bool __ovld atomic_flag_test_and_set(volatile atomic_flag __local *object); | ||
| 5968 | +void __ovld atomic_flag_clear(volatile atomic_flag __global *object); | ||
| 5969 | +void __ovld atomic_flag_clear(volatile atomic_flag __local *object); | ||
| 5970 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5971 | +#endif // defined(__opencl_c_atomic_scope_device) && | ||
| 5972 | + // defined(__opencl_c_atomic_order_seq_cst) | ||
| 5973 | + | ||
| 5974 | +#ifdef __opencl_c_generic_address_space | ||
| 5975 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5976 | +bool __ovld atomic_flag_test_and_set_explicit(volatile atomic_flag *object, | ||
| 5977 | + memory_order order); | ||
| 5978 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag *object, | ||
| 5979 | + memory_order order); | ||
| 5980 | +#endif // __opencl_c_atomic_scope_device | ||
| 5981 | +bool __ovld atomic_flag_test_and_set_explicit(volatile atomic_flag *object, | ||
| 5982 | + memory_order order, | ||
| 5983 | + memory_scope scope); | ||
| 5984 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag *object, | ||
| 5985 | + memory_order order, memory_scope scope); | ||
| 5986 | +#endif // __opencl_c_generic_address_space | ||
| 5987 | + | ||
| 5988 | +#if (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 5989 | +#ifdef __opencl_c_atomic_scope_device | ||
| 5990 | +bool __ovld atomic_flag_test_and_set_explicit( | ||
| 5991 | + volatile atomic_flag __global *object, memory_order order); | ||
| 5992 | +bool __ovld atomic_flag_test_and_set_explicit( | ||
| 5993 | + volatile atomic_flag __local *object, memory_order order); | ||
| 5994 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag __global *object, | ||
| 5995 | + memory_order order); | ||
| 5996 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag __local *object, | ||
| 5997 | + memory_order order); | ||
| 5998 | +#endif // __opencl_c_atomic_scope_device | ||
| 5999 | +bool __ovld | ||
| 6000 | +atomic_flag_test_and_set_explicit(volatile atomic_flag __global *object, | ||
| 6001 | + memory_order order, memory_scope scope); | ||
| 6002 | +bool __ovld | ||
| 6003 | +atomic_flag_test_and_set_explicit(volatile atomic_flag __local *object, | ||
| 6004 | + memory_order order, memory_scope scope); | ||
| 6005 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag __global *object, | ||
| 6006 | + memory_order order, memory_scope scope); | ||
| 6007 | +void __ovld atomic_flag_clear_explicit(volatile atomic_flag __local *object, | ||
| 6008 | + memory_order order, memory_scope scope); | ||
| 6009 | +#endif // (__OPENCL_C_VERSION__ >= CL_VERSION_3_0) | ||
| 6010 | |||
| 6011 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6012 | |||
| 6013 | @@ -13906,7 +15943,7 @@ float16 __ovld __cnfn shuffle(float4 x, uint16 mask); | ||
| 6014 | float16 __ovld __cnfn shuffle(float8 x, uint16 mask); | ||
| 6015 | float16 __ovld __cnfn shuffle(float16 x, uint16 mask); | ||
| 6016 | |||
| 6017 | -#ifdef cl_khr_fp64 | ||
| 6018 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6019 | double2 __ovld __cnfn shuffle(double2 x, ulong2 mask); | ||
| 6020 | double2 __ovld __cnfn shuffle(double4 x, ulong2 mask); | ||
| 6021 | double2 __ovld __cnfn shuffle(double8 x, ulong2 mask); | ||
| 6022 | @@ -13926,7 +15963,7 @@ double16 __ovld __cnfn shuffle(double2 x, ulong16 mask); | ||
| 6023 | double16 __ovld __cnfn shuffle(double4 x, ulong16 mask); | ||
| 6024 | double16 __ovld __cnfn shuffle(double8 x, ulong16 mask); | ||
| 6025 | double16 __ovld __cnfn shuffle(double16 x, ulong16 mask); | ||
| 6026 | -#endif //cl_khr_fp64 | ||
| 6027 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6028 | |||
| 6029 | #ifdef cl_khr_fp16 | ||
| 6030 | half2 __ovld __cnfn shuffle(half2 x, ushort2 mask); | ||
| 6031 | @@ -14130,7 +16167,7 @@ float16 __ovld __cnfn shuffle2(float4 x, float4 y, uint16 mask); | ||
| 6032 | float16 __ovld __cnfn shuffle2(float8 x, float8 y, uint16 mask); | ||
| 6033 | float16 __ovld __cnfn shuffle2(float16 x, float16 y, uint16 mask); | ||
| 6034 | |||
| 6035 | -#ifdef cl_khr_fp64 | ||
| 6036 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6037 | double2 __ovld __cnfn shuffle2(double2 x, double2 y, ulong2 mask); | ||
| 6038 | double2 __ovld __cnfn shuffle2(double4 x, double4 y, ulong2 mask); | ||
| 6039 | double2 __ovld __cnfn shuffle2(double8 x, double8 y, ulong2 mask); | ||
| 6040 | @@ -14150,7 +16187,7 @@ double16 __ovld __cnfn shuffle2(double2 x, double2 y, ulong16 mask); | ||
| 6041 | double16 __ovld __cnfn shuffle2(double4 x, double4 y, ulong16 mask); | ||
| 6042 | double16 __ovld __cnfn shuffle2(double8 x, double8 y, ulong16 mask); | ||
| 6043 | double16 __ovld __cnfn shuffle2(double16 x, double16 y, ulong16 mask); | ||
| 6044 | -#endif //cl_khr_fp64 | ||
| 6045 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6046 | |||
| 6047 | #ifdef cl_khr_fp16 | ||
| 6048 | half2 __ovld __cnfn shuffle2(half2 x, half2 y, ushort2 mask); | ||
| 6049 | @@ -14186,6 +16223,7 @@ int printf(__constant const char* st, ...) __attribute__((format(printf, 1, 2))) | ||
| 6050 | #pragma OPENCL EXTENSION cl_khr_gl_msaa_sharing : enable | ||
| 6051 | #endif //cl_khr_gl_msaa_sharing | ||
| 6052 | |||
| 6053 | +#ifdef __opencl_c_images | ||
| 6054 | /** | ||
| 6055 | * Use the coordinate (coord.xy) to do an element lookup in | ||
| 6056 | * the 2D image object specified by image. | ||
| 6057 | @@ -14464,6 +16502,7 @@ half4 __purefn __ovld read_imageh(read_only image1d_buffer_t image, int coord); | ||
| 6058 | |||
| 6059 | // Image read functions for read_write images | ||
| 6060 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6061 | +#ifdef __opencl_c_read_write_images | ||
| 6062 | float4 __purefn __ovld read_imagef(read_write image1d_t image, int coord); | ||
| 6063 | int4 __purefn __ovld read_imagei(read_write image1d_t image, int coord); | ||
| 6064 | uint4 __purefn __ovld read_imageui(read_write image1d_t image, int coord); | ||
| 6065 | @@ -14507,6 +16546,7 @@ float __purefn __ovld read_imagef(read_write image2d_array_msaa_depth_t image, i | ||
| 6066 | #endif //cl_khr_gl_msaa_sharing | ||
| 6067 | |||
| 6068 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6069 | +#ifdef __opencl_c_read_write_images | ||
| 6070 | #ifdef cl_khr_mipmap_image | ||
| 6071 | float4 __purefn __ovld read_imagef(read_write image1d_t image, sampler_t sampler, float coord, float lod); | ||
| 6072 | int4 __purefn __ovld read_imagei(read_write image1d_t image, sampler_t sampler, float coord, float lod); | ||
| 6073 | @@ -14557,6 +16597,7 @@ int4 __purefn __ovld read_imagei(read_write image3d_t image, sampler_t sampler, | ||
| 6074 | uint4 __purefn __ovld read_imageui(read_write image3d_t image, sampler_t sampler, float4 coord, float4 gradientX, float4 gradientY); | ||
| 6075 | |||
| 6076 | #endif //cl_khr_mipmap_image | ||
| 6077 | +#endif //__opencl_c_read_write_images | ||
| 6078 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6079 | |||
| 6080 | // Image read functions returning half4 type | ||
| 6081 | @@ -14568,6 +16609,7 @@ half4 __purefn __ovld read_imageh(read_write image1d_array_t image, int2 coord); | ||
| 6082 | half4 __purefn __ovld read_imageh(read_write image2d_array_t image, int4 coord); | ||
| 6083 | half4 __purefn __ovld read_imageh(read_write image1d_buffer_t image, int coord); | ||
| 6084 | #endif //cl_khr_fp16 | ||
| 6085 | +#endif //__opencl_c_read_write_images | ||
| 6086 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6087 | |||
| 6088 | /** | ||
| 6089 | @@ -14657,7 +16699,7 @@ void __ovld write_imagef(write_only image1d_array_t image_array, int2 coord, flo | ||
| 6090 | void __ovld write_imagei(write_only image1d_array_t image_array, int2 coord, int4 color); | ||
| 6091 | void __ovld write_imageui(write_only image1d_array_t image_array, int2 coord, uint4 color); | ||
| 6092 | |||
| 6093 | -#ifdef cl_khr_3d_image_writes | ||
| 6094 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6095 | void __ovld write_imagef(write_only image3d_t image, int4 coord, float4 color); | ||
| 6096 | void __ovld write_imagei(write_only image3d_t image, int4 coord, int4 color); | ||
| 6097 | void __ovld write_imageui(write_only image3d_t image, int4 coord, uint4 color); | ||
| 6098 | @@ -14690,7 +16732,7 @@ void __ovld write_imageui(write_only image2d_array_t image_array, int4 coord, in | ||
| 6099 | void __ovld write_imagef(write_only image2d_depth_t image, int2 coord, int lod, float depth); | ||
| 6100 | void __ovld write_imagef(write_only image2d_array_depth_t image, int4 coord, int lod, float depth); | ||
| 6101 | |||
| 6102 | -#ifdef cl_khr_3d_image_writes | ||
| 6103 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6104 | void __ovld write_imagef(write_only image3d_t image, int4 coord, int lod, float4 color); | ||
| 6105 | void __ovld write_imagei(write_only image3d_t image, int4 coord, int lod, int4 color); | ||
| 6106 | void __ovld write_imageui(write_only image3d_t image, int4 coord, int lod, uint4 color); | ||
| 6107 | @@ -14703,7 +16745,7 @@ void __ovld write_imageui(write_only image3d_t image, int4 coord, int lod, uint4 | ||
| 6108 | #ifdef cl_khr_fp16 | ||
| 6109 | void __ovld write_imageh(write_only image1d_t image, int coord, half4 color); | ||
| 6110 | void __ovld write_imageh(write_only image2d_t image, int2 coord, half4 color); | ||
| 6111 | -#ifdef cl_khr_3d_image_writes | ||
| 6112 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6113 | void __ovld write_imageh(write_only image3d_t image, int4 coord, half4 color); | ||
| 6114 | #endif | ||
| 6115 | void __ovld write_imageh(write_only image1d_array_t image, int2 coord, half4 color); | ||
| 6116 | @@ -14713,6 +16755,7 @@ void __ovld write_imageh(write_only image1d_buffer_t image, int coord, half4 col | ||
| 6117 | |||
| 6118 | // Image write functions for read_write images | ||
| 6119 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6120 | +#ifdef __opencl_c_read_write_images | ||
| 6121 | void __ovld write_imagef(read_write image2d_t image, int2 coord, float4 color); | ||
| 6122 | void __ovld write_imagei(read_write image2d_t image, int2 coord, int4 color); | ||
| 6123 | void __ovld write_imageui(read_write image2d_t image, int2 coord, uint4 color); | ||
| 6124 | @@ -14733,7 +16776,7 @@ void __ovld write_imagef(read_write image1d_array_t image_array, int2 coord, flo | ||
| 6125 | void __ovld write_imagei(read_write image1d_array_t image_array, int2 coord, int4 color); | ||
| 6126 | void __ovld write_imageui(read_write image1d_array_t image_array, int2 coord, uint4 color); | ||
| 6127 | |||
| 6128 | -#ifdef cl_khr_3d_image_writes | ||
| 6129 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6130 | void __ovld write_imagef(read_write image3d_t image, int4 coord, float4 color); | ||
| 6131 | void __ovld write_imagei(read_write image3d_t image, int4 coord, int4 color); | ||
| 6132 | void __ovld write_imageui(read_write image3d_t image, int4 coord, uint4 color); | ||
| 6133 | @@ -14765,7 +16808,7 @@ void __ovld write_imageui(read_write image2d_array_t image_array, int4 coord, in | ||
| 6134 | void __ovld write_imagef(read_write image2d_depth_t image, int2 coord, int lod, float color); | ||
| 6135 | void __ovld write_imagef(read_write image2d_array_depth_t image, int4 coord, int lod, float color); | ||
| 6136 | |||
| 6137 | -#ifdef cl_khr_3d_image_writes | ||
| 6138 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6139 | void __ovld write_imagef(read_write image3d_t image, int4 coord, int lod, float4 color); | ||
| 6140 | void __ovld write_imagei(read_write image3d_t image, int4 coord, int lod, int4 color); | ||
| 6141 | void __ovld write_imageui(read_write image3d_t image, int4 coord, int lod, uint4 color); | ||
| 6142 | @@ -14778,13 +16821,14 @@ void __ovld write_imageui(read_write image3d_t image, int4 coord, int lod, uint4 | ||
| 6143 | #ifdef cl_khr_fp16 | ||
| 6144 | void __ovld write_imageh(read_write image1d_t image, int coord, half4 color); | ||
| 6145 | void __ovld write_imageh(read_write image2d_t image, int2 coord, half4 color); | ||
| 6146 | -#ifdef cl_khr_3d_image_writes | ||
| 6147 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6148 | void __ovld write_imageh(read_write image3d_t image, int4 coord, half4 color); | ||
| 6149 | #endif | ||
| 6150 | void __ovld write_imageh(read_write image1d_array_t image, int2 coord, half4 color); | ||
| 6151 | void __ovld write_imageh(read_write image2d_array_t image, int4 coord, half4 color); | ||
| 6152 | void __ovld write_imageh(read_write image1d_buffer_t image, int coord, half4 color); | ||
| 6153 | #endif //cl_khr_fp16 | ||
| 6154 | +#endif //__opencl_c_read_write_images | ||
| 6155 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6156 | |||
| 6157 | // Note: In OpenCL v1.0/1.1/1.2, image argument of image query builtin functions does not have | ||
| 6158 | @@ -14798,7 +16842,7 @@ void __ovld write_imageh(read_write image1d_buffer_t image, int coord, half4 col | ||
| 6159 | int __ovld __cnfn get_image_width(read_only image1d_t image); | ||
| 6160 | int __ovld __cnfn get_image_width(read_only image1d_buffer_t image); | ||
| 6161 | int __ovld __cnfn get_image_width(read_only image2d_t image); | ||
| 6162 | -#ifdef cl_khr_3d_image_writes | ||
| 6163 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6164 | int __ovld __cnfn get_image_width(read_only image3d_t image); | ||
| 6165 | #endif | ||
| 6166 | int __ovld __cnfn get_image_width(read_only image1d_array_t image); | ||
| 6167 | @@ -14817,7 +16861,7 @@ int __ovld __cnfn get_image_width(read_only image2d_array_msaa_depth_t image); | ||
| 6168 | int __ovld __cnfn get_image_width(write_only image1d_t image); | ||
| 6169 | int __ovld __cnfn get_image_width(write_only image1d_buffer_t image); | ||
| 6170 | int __ovld __cnfn get_image_width(write_only image2d_t image); | ||
| 6171 | -#ifdef cl_khr_3d_image_writes | ||
| 6172 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6173 | int __ovld __cnfn get_image_width(write_only image3d_t image); | ||
| 6174 | #endif | ||
| 6175 | int __ovld __cnfn get_image_width(write_only image1d_array_t image); | ||
| 6176 | @@ -14834,6 +16878,7 @@ int __ovld __cnfn get_image_width(write_only image2d_array_msaa_depth_t image); | ||
| 6177 | #endif //cl_khr_gl_msaa_sharing | ||
| 6178 | |||
| 6179 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6180 | +#ifdef __opencl_c_read_write_images | ||
| 6181 | int __ovld __cnfn get_image_width(read_write image1d_t image); | ||
| 6182 | int __ovld __cnfn get_image_width(read_write image1d_buffer_t image); | ||
| 6183 | int __ovld __cnfn get_image_width(read_write image2d_t image); | ||
| 6184 | @@ -14850,6 +16895,7 @@ int __ovld __cnfn get_image_width(read_write image2d_msaa_depth_t image); | ||
| 6185 | int __ovld __cnfn get_image_width(read_write image2d_array_msaa_t image); | ||
| 6186 | int __ovld __cnfn get_image_width(read_write image2d_array_msaa_depth_t image); | ||
| 6187 | #endif //cl_khr_gl_msaa_sharing | ||
| 6188 | +#endif //__opencl_c_read_write_images | ||
| 6189 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6190 | |||
| 6191 | /** | ||
| 6192 | @@ -14870,7 +16916,7 @@ int __ovld __cnfn get_image_height(read_only image2d_array_msaa_depth_t image); | ||
| 6193 | #endif //cl_khr_gl_msaa_sharing | ||
| 6194 | |||
| 6195 | int __ovld __cnfn get_image_height(write_only image2d_t image); | ||
| 6196 | -#ifdef cl_khr_3d_image_writes | ||
| 6197 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6198 | int __ovld __cnfn get_image_height(write_only image3d_t image); | ||
| 6199 | #endif | ||
| 6200 | int __ovld __cnfn get_image_height(write_only image2d_array_t image); | ||
| 6201 | @@ -14886,6 +16932,7 @@ int __ovld __cnfn get_image_height(write_only image2d_array_msaa_depth_t image); | ||
| 6202 | #endif //cl_khr_gl_msaa_sharing | ||
| 6203 | |||
| 6204 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6205 | +#ifdef __opencl_c_read_write_images | ||
| 6206 | int __ovld __cnfn get_image_height(read_write image2d_t image); | ||
| 6207 | int __ovld __cnfn get_image_height(read_write image3d_t image); | ||
| 6208 | int __ovld __cnfn get_image_height(read_write image2d_array_t image); | ||
| 6209 | @@ -14899,6 +16946,7 @@ int __ovld __cnfn get_image_height(read_write image2d_msaa_depth_t image); | ||
| 6210 | int __ovld __cnfn get_image_height(read_write image2d_array_msaa_t image); | ||
| 6211 | int __ovld __cnfn get_image_height(read_write image2d_array_msaa_depth_t image); | ||
| 6212 | #endif //cl_khr_gl_msaa_sharing | ||
| 6213 | +#endif //__opencl_c_read_write_images | ||
| 6214 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6215 | |||
| 6216 | /** | ||
| 6217 | @@ -14906,12 +16954,14 @@ int __ovld __cnfn get_image_height(read_write image2d_array_msaa_depth_t image); | ||
| 6218 | */ | ||
| 6219 | int __ovld __cnfn get_image_depth(read_only image3d_t image); | ||
| 6220 | |||
| 6221 | -#ifdef cl_khr_3d_image_writes | ||
| 6222 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6223 | int __ovld __cnfn get_image_depth(write_only image3d_t image); | ||
| 6224 | #endif | ||
| 6225 | |||
| 6226 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6227 | +#ifdef __opencl_c_read_write_images | ||
| 6228 | int __ovld __cnfn get_image_depth(read_write image3d_t image); | ||
| 6229 | +#endif //__opencl_c_read_write_images | ||
| 6230 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6231 | |||
| 6232 | // OpenCL Extension v2.0 s9.18 - Mipmaps | ||
| 6233 | @@ -14927,13 +16977,15 @@ int __ovld get_image_num_mip_levels(read_only image3d_t image); | ||
| 6234 | |||
| 6235 | int __ovld get_image_num_mip_levels(write_only image1d_t image); | ||
| 6236 | int __ovld get_image_num_mip_levels(write_only image2d_t image); | ||
| 6237 | -#ifdef cl_khr_3d_image_writes | ||
| 6238 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6239 | int __ovld get_image_num_mip_levels(write_only image3d_t image); | ||
| 6240 | #endif | ||
| 6241 | |||
| 6242 | +#ifdef __opencl_c_read_write_images | ||
| 6243 | int __ovld get_image_num_mip_levels(read_write image1d_t image); | ||
| 6244 | int __ovld get_image_num_mip_levels(read_write image2d_t image); | ||
| 6245 | int __ovld get_image_num_mip_levels(read_write image3d_t image); | ||
| 6246 | +#endif //__opencl_c_read_write_images | ||
| 6247 | |||
| 6248 | int __ovld get_image_num_mip_levels(read_only image1d_array_t image); | ||
| 6249 | int __ovld get_image_num_mip_levels(read_only image2d_array_t image); | ||
| 6250 | @@ -14945,10 +16997,12 @@ int __ovld get_image_num_mip_levels(write_only image2d_array_t image); | ||
| 6251 | int __ovld get_image_num_mip_levels(write_only image2d_array_depth_t image); | ||
| 6252 | int __ovld get_image_num_mip_levels(write_only image2d_depth_t image); | ||
| 6253 | |||
| 6254 | +#ifdef __opencl_c_read_write_images | ||
| 6255 | int __ovld get_image_num_mip_levels(read_write image1d_array_t image); | ||
| 6256 | int __ovld get_image_num_mip_levels(read_write image2d_array_t image); | ||
| 6257 | int __ovld get_image_num_mip_levels(read_write image2d_array_depth_t image); | ||
| 6258 | int __ovld get_image_num_mip_levels(read_write image2d_depth_t image); | ||
| 6259 | +#endif //__opencl_c_read_write_images | ||
| 6260 | |||
| 6261 | #endif //cl_khr_mipmap_image | ||
| 6262 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6263 | @@ -14992,7 +17046,7 @@ int __ovld __cnfn get_image_channel_data_type(read_only image2d_array_msaa_depth | ||
| 6264 | int __ovld __cnfn get_image_channel_data_type(write_only image1d_t image); | ||
| 6265 | int __ovld __cnfn get_image_channel_data_type(write_only image1d_buffer_t image); | ||
| 6266 | int __ovld __cnfn get_image_channel_data_type(write_only image2d_t image); | ||
| 6267 | -#ifdef cl_khr_3d_image_writes | ||
| 6268 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6269 | int __ovld __cnfn get_image_channel_data_type(write_only image3d_t image); | ||
| 6270 | #endif | ||
| 6271 | int __ovld __cnfn get_image_channel_data_type(write_only image1d_array_t image); | ||
| 6272 | @@ -15009,6 +17063,7 @@ int __ovld __cnfn get_image_channel_data_type(write_only image2d_array_msaa_dept | ||
| 6273 | #endif //cl_khr_gl_msaa_sharing | ||
| 6274 | |||
| 6275 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6276 | +#ifdef __opencl_c_read_write_images | ||
| 6277 | int __ovld __cnfn get_image_channel_data_type(read_write image1d_t image); | ||
| 6278 | int __ovld __cnfn get_image_channel_data_type(read_write image1d_buffer_t image); | ||
| 6279 | int __ovld __cnfn get_image_channel_data_type(read_write image2d_t image); | ||
| 6280 | @@ -15025,6 +17080,7 @@ int __ovld __cnfn get_image_channel_data_type(read_write image2d_msaa_depth_t im | ||
| 6281 | int __ovld __cnfn get_image_channel_data_type(read_write image2d_array_msaa_t image); | ||
| 6282 | int __ovld __cnfn get_image_channel_data_type(read_write image2d_array_msaa_depth_t image); | ||
| 6283 | #endif //cl_khr_gl_msaa_sharing | ||
| 6284 | +#endif //__opencl_c_read_write_images | ||
| 6285 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6286 | |||
| 6287 | /** | ||
| 6288 | @@ -15064,7 +17120,7 @@ int __ovld __cnfn get_image_channel_order(read_only image2d_array_msaa_depth_t i | ||
| 6289 | int __ovld __cnfn get_image_channel_order(write_only image1d_t image); | ||
| 6290 | int __ovld __cnfn get_image_channel_order(write_only image1d_buffer_t image); | ||
| 6291 | int __ovld __cnfn get_image_channel_order(write_only image2d_t image); | ||
| 6292 | -#ifdef cl_khr_3d_image_writes | ||
| 6293 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6294 | int __ovld __cnfn get_image_channel_order(write_only image3d_t image); | ||
| 6295 | #endif | ||
| 6296 | int __ovld __cnfn get_image_channel_order(write_only image1d_array_t image); | ||
| 6297 | @@ -15081,6 +17137,7 @@ int __ovld __cnfn get_image_channel_order(write_only image2d_array_msaa_depth_t | ||
| 6298 | #endif //cl_khr_gl_msaa_sharing | ||
| 6299 | |||
| 6300 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6301 | +#ifdef __opencl_c_read_write_images | ||
| 6302 | int __ovld __cnfn get_image_channel_order(read_write image1d_t image); | ||
| 6303 | int __ovld __cnfn get_image_channel_order(read_write image1d_buffer_t image); | ||
| 6304 | int __ovld __cnfn get_image_channel_order(read_write image2d_t image); | ||
| 6305 | @@ -15097,6 +17154,7 @@ int __ovld __cnfn get_image_channel_order(read_write image2d_msaa_depth_t image) | ||
| 6306 | int __ovld __cnfn get_image_channel_order(read_write image2d_array_msaa_t image); | ||
| 6307 | int __ovld __cnfn get_image_channel_order(read_write image2d_array_msaa_depth_t image); | ||
| 6308 | #endif //cl_khr_gl_msaa_sharing | ||
| 6309 | +#endif //__opencl_c_read_write_images | ||
| 6310 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6311 | |||
| 6312 | /** | ||
| 6313 | @@ -15131,6 +17189,7 @@ int2 __ovld __cnfn get_image_dim(write_only image2d_array_msaa_depth_t image); | ||
| 6314 | #endif //cl_khr_gl_msaa_sharing | ||
| 6315 | |||
| 6316 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6317 | +#ifdef __opencl_c_read_write_images | ||
| 6318 | int2 __ovld __cnfn get_image_dim(read_write image2d_t image); | ||
| 6319 | int2 __ovld __cnfn get_image_dim(read_write image2d_array_t image); | ||
| 6320 | #ifdef cl_khr_depth_images | ||
| 6321 | @@ -15143,6 +17202,7 @@ int2 __ovld __cnfn get_image_dim(read_write image2d_msaa_depth_t image); | ||
| 6322 | int2 __ovld __cnfn get_image_dim(read_write image2d_array_msaa_t image); | ||
| 6323 | int2 __ovld __cnfn get_image_dim(read_write image2d_array_msaa_depth_t image); | ||
| 6324 | #endif //cl_khr_gl_msaa_sharing | ||
| 6325 | +#endif //__opencl_c_read_write_images | ||
| 6326 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6327 | |||
| 6328 | /** | ||
| 6329 | @@ -15152,11 +17212,13 @@ int2 __ovld __cnfn get_image_dim(read_write image2d_array_msaa_depth_t image); | ||
| 6330 | * component and the w component is 0. | ||
| 6331 | */ | ||
| 6332 | int4 __ovld __cnfn get_image_dim(read_only image3d_t image); | ||
| 6333 | -#ifdef cl_khr_3d_image_writes | ||
| 6334 | +#if defined(cl_khr_3d_image_writes) || defined(__opencl_c_3d_image_writes) | ||
| 6335 | int4 __ovld __cnfn get_image_dim(write_only image3d_t image); | ||
| 6336 | #endif | ||
| 6337 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6338 | +#ifdef __opencl_c_read_write_images | ||
| 6339 | int4 __ovld __cnfn get_image_dim(read_write image3d_t image); | ||
| 6340 | +#endif //__opencl_c_read_write_images | ||
| 6341 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6342 | |||
| 6343 | /** | ||
| 6344 | @@ -15184,6 +17246,7 @@ size_t __ovld __cnfn get_image_array_size(write_only image2d_array_msaa_depth_t | ||
| 6345 | #endif //cl_khr_gl_msaa_sharing | ||
| 6346 | |||
| 6347 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6348 | +#ifdef __opencl_c_read_write_images | ||
| 6349 | size_t __ovld __cnfn get_image_array_size(read_write image1d_array_t image_array); | ||
| 6350 | size_t __ovld __cnfn get_image_array_size(read_write image2d_array_t image_array); | ||
| 6351 | #ifdef cl_khr_depth_images | ||
| 6352 | @@ -15193,6 +17256,7 @@ size_t __ovld __cnfn get_image_array_size(read_write image2d_array_depth_t image | ||
| 6353 | size_t __ovld __cnfn get_image_array_size(read_write image2d_array_msaa_t image_array); | ||
| 6354 | size_t __ovld __cnfn get_image_array_size(read_write image2d_array_msaa_depth_t image_array); | ||
| 6355 | #endif //cl_khr_gl_msaa_sharing | ||
| 6356 | +#endif //__opencl_c_read_write_images | ||
| 6357 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6358 | |||
| 6359 | /** | ||
| 6360 | @@ -15210,16 +17274,21 @@ int __ovld get_image_num_samples(write_only image2d_array_msaa_t image); | ||
| 6361 | int __ovld get_image_num_samples(write_only image2d_array_msaa_depth_t image); | ||
| 6362 | |||
| 6363 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6364 | +#ifdef __opencl_c_read_write_images | ||
| 6365 | int __ovld get_image_num_samples(read_write image2d_msaa_t image); | ||
| 6366 | int __ovld get_image_num_samples(read_write image2d_msaa_depth_t image); | ||
| 6367 | int __ovld get_image_num_samples(read_write image2d_array_msaa_t image); | ||
| 6368 | int __ovld get_image_num_samples(read_write image2d_array_msaa_depth_t image); | ||
| 6369 | +#endif //__opencl_c_read_write_images | ||
| 6370 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6371 | #endif | ||
| 6372 | |||
| 6373 | +#endif //__opencl_c_images | ||
| 6374 | + | ||
| 6375 | // OpenCL v2.0 s6.13.15 - Work-group Functions | ||
| 6376 | |||
| 6377 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6378 | +#ifdef __opencl_c_work_group_collective_functions | ||
| 6379 | int __ovld __conv work_group_all(int predicate); | ||
| 6380 | int __ovld __conv work_group_any(int predicate); | ||
| 6381 | |||
| 6382 | @@ -15243,11 +17312,11 @@ ulong __ovld __conv work_group_broadcast(ulong a, size_t x, size_t y, size_t z); | ||
| 6383 | float __ovld __conv work_group_broadcast(float a, size_t local_id); | ||
| 6384 | float __ovld __conv work_group_broadcast(float a, size_t x, size_t y); | ||
| 6385 | float __ovld __conv work_group_broadcast(float a, size_t x, size_t y, size_t z); | ||
| 6386 | -#ifdef cl_khr_fp64 | ||
| 6387 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6388 | double __ovld __conv work_group_broadcast(double a, size_t local_id); | ||
| 6389 | double __ovld __conv work_group_broadcast(double a, size_t x, size_t y); | ||
| 6390 | double __ovld __conv work_group_broadcast(double a, size_t x, size_t y, size_t z); | ||
| 6391 | -#endif //cl_khr_fp64 | ||
| 6392 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6393 | |||
| 6394 | #ifdef cl_khr_fp16 | ||
| 6395 | half __ovld __conv work_group_reduce_add(half x); | ||
| 6396 | @@ -15305,7 +17374,7 @@ float __ovld __conv work_group_scan_exclusive_max(float x); | ||
| 6397 | float __ovld __conv work_group_scan_inclusive_add(float x); | ||
| 6398 | float __ovld __conv work_group_scan_inclusive_min(float x); | ||
| 6399 | float __ovld __conv work_group_scan_inclusive_max(float x); | ||
| 6400 | -#ifdef cl_khr_fp64 | ||
| 6401 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6402 | double __ovld __conv work_group_reduce_add(double x); | ||
| 6403 | double __ovld __conv work_group_reduce_min(double x); | ||
| 6404 | double __ovld __conv work_group_reduce_max(double x); | ||
| 6405 | @@ -15315,19 +17384,18 @@ double __ovld __conv work_group_scan_exclusive_max(double x); | ||
| 6406 | double __ovld __conv work_group_scan_inclusive_add(double x); | ||
| 6407 | double __ovld __conv work_group_scan_inclusive_min(double x); | ||
| 6408 | double __ovld __conv work_group_scan_inclusive_max(double x); | ||
| 6409 | -#endif //cl_khr_fp64 | ||
| 6410 | - | ||
| 6411 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6412 | +#endif //__opencl_c_work_group_collective_functions | ||
| 6413 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6414 | |||
| 6415 | // OpenCL v2.0 s6.13.16 - Pipe Functions | ||
| 6416 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6417 | +#ifdef __opencl_c_pipes | ||
| 6418 | bool __ovld is_valid_reserve_id(reserve_id_t reserve_id); | ||
| 6419 | -#endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6420 | - | ||
| 6421 | +#endif //__opencl_c_pipes | ||
| 6422 | |||
| 6423 | // OpenCL v2.0 s6.13.17 - Enqueue Kernels | ||
| 6424 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6425 | - | ||
| 6426 | +#ifdef __opencl_c_device_enqueue | ||
| 6427 | ndrange_t __ovld ndrange_1D(size_t); | ||
| 6428 | ndrange_t __ovld ndrange_1D(size_t, size_t); | ||
| 6429 | ndrange_t __ovld ndrange_1D(size_t, size_t, size_t); | ||
| 6430 | @@ -15355,11 +17423,13 @@ bool __ovld is_valid_event (clk_event_t event); | ||
| 6431 | void __ovld capture_event_profiling_info(clk_event_t, clk_profiling_info, __global void* value); | ||
| 6432 | |||
| 6433 | queue_t __ovld get_default_queue(void); | ||
| 6434 | +#endif //__opencl_c_device_enqueue | ||
| 6435 | #endif //defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6436 | |||
| 6437 | // OpenCL Extension v2.0 s9.17 - Sub-groups | ||
| 6438 | |||
| 6439 | -#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups) | ||
| 6440 | +#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups) || \ | ||
| 6441 | + defined(__opencl_c_subgroups) | ||
| 6442 | // Shared Sub Group Functions | ||
| 6443 | uint __ovld get_sub_group_size(void); | ||
| 6444 | uint __ovld get_max_sub_group_size(void); | ||
| 6445 | @@ -15445,7 +17515,7 @@ half __ovld __conv sub_group_scan_inclusive_min(half x); | ||
| 6446 | half __ovld __conv sub_group_scan_inclusive_max(half x); | ||
| 6447 | #endif //cl_khr_fp16 | ||
| 6448 | |||
| 6449 | -#ifdef cl_khr_fp64 | ||
| 6450 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6451 | double __ovld __conv sub_group_broadcast(double x, uint sub_group_local_id); | ||
| 6452 | double __ovld __conv sub_group_reduce_add(double x); | ||
| 6453 | double __ovld __conv sub_group_reduce_min(double x); | ||
| 6454 | @@ -15456,7 +17526,7 @@ double __ovld __conv sub_group_scan_exclusive_max(double x); | ||
| 6455 | double __ovld __conv sub_group_scan_inclusive_add(double x); | ||
| 6456 | double __ovld __conv sub_group_scan_inclusive_min(double x); | ||
| 6457 | double __ovld __conv sub_group_scan_inclusive_max(double x); | ||
| 6458 | -#endif //cl_khr_fp64 | ||
| 6459 | +#endif // defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6460 | |||
| 6461 | #endif //cl_khr_subgroups cl_intel_subgroups | ||
| 6462 | |||
| 6463 | @@ -16226,16 +18296,22 @@ uint16 __ovld __conv intel_sub_group_shuffle_xor( uint16 x, uint c ); | ||
| 6464 | long __ovld __conv intel_sub_group_shuffle_xor( long x, uint c ); | ||
| 6465 | ulong __ovld __conv intel_sub_group_shuffle_xor( ulong x, uint c ); | ||
| 6466 | |||
| 6467 | +#ifdef __opencl_c_images | ||
| 6468 | uint __ovld __conv intel_sub_group_block_read( read_only image2d_t image, int2 coord ); | ||
| 6469 | uint2 __ovld __conv intel_sub_group_block_read2( read_only image2d_t image, int2 coord ); | ||
| 6470 | uint4 __ovld __conv intel_sub_group_block_read4( read_only image2d_t image, int2 coord ); | ||
| 6471 | uint8 __ovld __conv intel_sub_group_block_read8( read_only image2d_t image, int2 coord ); | ||
| 6472 | +#endif //__opencl_c_images | ||
| 6473 | |||
| 6474 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6475 | +#ifdef __opencl_c_images | ||
| 6476 | +#ifdef __opencl_c_read_write_images | ||
| 6477 | uint __ovld __conv intel_sub_group_block_read(read_write image2d_t image, int2 coord); | ||
| 6478 | uint2 __ovld __conv intel_sub_group_block_read2(read_write image2d_t image, int2 coord); | ||
| 6479 | uint4 __ovld __conv intel_sub_group_block_read4(read_write image2d_t image, int2 coord); | ||
| 6480 | uint8 __ovld __conv intel_sub_group_block_read8(read_write image2d_t image, int2 coord); | ||
| 6481 | +#endif //__opencl_c_read_write_images | ||
| 6482 | +#endif //__opencl_c_images | ||
| 6483 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6484 | |||
| 6485 | uint __ovld __conv intel_sub_group_block_read( const __global uint* p ); | ||
| 6486 | @@ -16243,16 +18319,22 @@ uint2 __ovld __conv intel_sub_group_block_read2( const __global uint* p ); | ||
| 6487 | uint4 __ovld __conv intel_sub_group_block_read4( const __global uint* p ); | ||
| 6488 | uint8 __ovld __conv intel_sub_group_block_read8( const __global uint* p ); | ||
| 6489 | |||
| 6490 | +#ifdef __opencl_c_images | ||
| 6491 | void __ovld __conv intel_sub_group_block_write(write_only image2d_t image, int2 coord, uint data); | ||
| 6492 | void __ovld __conv intel_sub_group_block_write2(write_only image2d_t image, int2 coord, uint2 data); | ||
| 6493 | void __ovld __conv intel_sub_group_block_write4(write_only image2d_t image, int2 coord, uint4 data); | ||
| 6494 | void __ovld __conv intel_sub_group_block_write8(write_only image2d_t image, int2 coord, uint8 data); | ||
| 6495 | +#endif //__opencl_c_images | ||
| 6496 | |||
| 6497 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6498 | +#ifdef __opencl_c_images | ||
| 6499 | +#ifdef __opencl_c_read_write_images | ||
| 6500 | void __ovld __conv intel_sub_group_block_write(read_write image2d_t image, int2 coord, uint data); | ||
| 6501 | void __ovld __conv intel_sub_group_block_write2(read_write image2d_t image, int2 coord, uint2 data); | ||
| 6502 | void __ovld __conv intel_sub_group_block_write4(read_write image2d_t image, int2 coord, uint4 data); | ||
| 6503 | void __ovld __conv intel_sub_group_block_write8(read_write image2d_t image, int2 coord, uint8 data); | ||
| 6504 | +#endif // __opencl_c_read_write_images | ||
| 6505 | +#endif // __opencl_c_images | ||
| 6506 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6507 | |||
| 6508 | void __ovld __conv intel_sub_group_block_write( __global uint* p, uint data ); | ||
| 6509 | @@ -16267,7 +18349,7 @@ half __ovld __conv intel_sub_group_shuffle_up( half prev, half cur, uint c ); | ||
| 6510 | half __ovld __conv intel_sub_group_shuffle_xor( half x, uint c ); | ||
| 6511 | #endif | ||
| 6512 | |||
| 6513 | -#if defined(cl_khr_fp64) | ||
| 6514 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 6515 | double __ovld __conv intel_sub_group_shuffle( double x, uint c ); | ||
| 6516 | double __ovld __conv intel_sub_group_shuffle_down( double prev, double cur, uint c ); | ||
| 6517 | double __ovld __conv intel_sub_group_shuffle_up( double prev, double cur, uint c ); | ||
| 6518 | @@ -16366,16 +18448,22 @@ ushort __ovld __conv intel_sub_group_scan_inclusive_min( ushort x ); | ||
| 6519 | short __ovld __conv intel_sub_group_scan_inclusive_max( short x ); | ||
| 6520 | ushort __ovld __conv intel_sub_group_scan_inclusive_max( ushort x ); | ||
| 6521 | |||
| 6522 | +#ifdef __opencl_c_images | ||
| 6523 | uint __ovld __conv intel_sub_group_block_read_ui( read_only image2d_t image, int2 byte_coord ); | ||
| 6524 | uint2 __ovld __conv intel_sub_group_block_read_ui2( read_only image2d_t image, int2 byte_coord ); | ||
| 6525 | uint4 __ovld __conv intel_sub_group_block_read_ui4( read_only image2d_t image, int2 byte_coord ); | ||
| 6526 | uint8 __ovld __conv intel_sub_group_block_read_ui8( read_only image2d_t image, int2 byte_coord ); | ||
| 6527 | +#endif //__opencl_c_images | ||
| 6528 | |||
| 6529 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6530 | +#ifdef __opencl_c_images | ||
| 6531 | +#ifdef __opencl_c_read_write_images | ||
| 6532 | uint __ovld __conv intel_sub_group_block_read_ui( read_write image2d_t image, int2 byte_coord ); | ||
| 6533 | uint2 __ovld __conv intel_sub_group_block_read_ui2( read_write image2d_t image, int2 byte_coord ); | ||
| 6534 | uint4 __ovld __conv intel_sub_group_block_read_ui4( read_write image2d_t image, int2 byte_coord ); | ||
| 6535 | uint8 __ovld __conv intel_sub_group_block_read_ui8( read_write image2d_t image, int2 byte_coord ); | ||
| 6536 | +#endif //__opencl_c_read_write_images | ||
| 6537 | +#endif //__opencl_c_images | ||
| 6538 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6539 | |||
| 6540 | uint __ovld __conv intel_sub_group_block_read_ui( const __global uint* p ); | ||
| 6541 | @@ -16383,16 +18471,22 @@ uint2 __ovld __conv intel_sub_group_block_read_ui2( const __global uint* p | ||
| 6542 | uint4 __ovld __conv intel_sub_group_block_read_ui4( const __global uint* p ); | ||
| 6543 | uint8 __ovld __conv intel_sub_group_block_read_ui8( const __global uint* p ); | ||
| 6544 | |||
| 6545 | +#ifdef __opencl_c_images | ||
| 6546 | void __ovld __conv intel_sub_group_block_write_ui( read_only image2d_t image, int2 byte_coord, uint data ); | ||
| 6547 | void __ovld __conv intel_sub_group_block_write_ui2( read_only image2d_t image, int2 byte_coord, uint2 data ); | ||
| 6548 | void __ovld __conv intel_sub_group_block_write_ui4( read_only image2d_t image, int2 byte_coord, uint4 data ); | ||
| 6549 | void __ovld __conv intel_sub_group_block_write_ui8( read_only image2d_t image, int2 byte_coord, uint8 data ); | ||
| 6550 | +#endif //__opencl_c_images | ||
| 6551 | |||
| 6552 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6553 | +#ifdef __opencl_c_images | ||
| 6554 | +#ifdef __opencl_c_read_write_images | ||
| 6555 | void __ovld __conv intel_sub_group_block_write_ui( read_write image2d_t image, int2 byte_coord, uint data ); | ||
| 6556 | void __ovld __conv intel_sub_group_block_write_ui2( read_write image2d_t image, int2 byte_coord, uint2 data ); | ||
| 6557 | void __ovld __conv intel_sub_group_block_write_ui4( read_write image2d_t image, int2 byte_coord, uint4 data ); | ||
| 6558 | void __ovld __conv intel_sub_group_block_write_ui8( read_write image2d_t image, int2 byte_coord, uint8 data ); | ||
| 6559 | +#endif //__opencl_c_read_write_images | ||
| 6560 | +#endif //__opencl_c_images | ||
| 6561 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6562 | |||
| 6563 | void __ovld __conv intel_sub_group_block_write_ui( __global uint* p, uint data ); | ||
| 6564 | @@ -16400,16 +18494,22 @@ void __ovld __conv intel_sub_group_block_write_ui2( __global uint* p, uint | ||
| 6565 | void __ovld __conv intel_sub_group_block_write_ui4( __global uint* p, uint4 data ); | ||
| 6566 | void __ovld __conv intel_sub_group_block_write_ui8( __global uint* p, uint8 data ); | ||
| 6567 | |||
| 6568 | +#ifdef __opencl_c_images | ||
| 6569 | ushort __ovld __conv intel_sub_group_block_read_us( read_only image2d_t image, int2 coord ); | ||
| 6570 | ushort2 __ovld __conv intel_sub_group_block_read_us2( read_only image2d_t image, int2 coord ); | ||
| 6571 | ushort4 __ovld __conv intel_sub_group_block_read_us4( read_only image2d_t image, int2 coord ); | ||
| 6572 | ushort8 __ovld __conv intel_sub_group_block_read_us8( read_only image2d_t image, int2 coord ); | ||
| 6573 | +#endif //__opencl_c_images | ||
| 6574 | |||
| 6575 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6576 | +#ifdef __opencl_c_images | ||
| 6577 | +#ifdef __opencl_c_read_write_images | ||
| 6578 | ushort __ovld __conv intel_sub_group_block_read_us(read_write image2d_t image, int2 coord); | ||
| 6579 | ushort2 __ovld __conv intel_sub_group_block_read_us2(read_write image2d_t image, int2 coord); | ||
| 6580 | ushort4 __ovld __conv intel_sub_group_block_read_us4(read_write image2d_t image, int2 coord); | ||
| 6581 | ushort8 __ovld __conv intel_sub_group_block_read_us8(read_write image2d_t image, int2 coord); | ||
| 6582 | +#endif //__opencl_c_read_write_images | ||
| 6583 | +#endif //__opencl_c_images | ||
| 6584 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6585 | |||
| 6586 | ushort __ovld __conv intel_sub_group_block_read_us( const __global ushort* p ); | ||
| 6587 | @@ -16417,16 +18517,22 @@ ushort2 __ovld __conv intel_sub_group_block_read_us2( const __global ushort* | ||
| 6588 | ushort4 __ovld __conv intel_sub_group_block_read_us4( const __global ushort* p ); | ||
| 6589 | ushort8 __ovld __conv intel_sub_group_block_read_us8( const __global ushort* p ); | ||
| 6590 | |||
| 6591 | +#ifdef __opencl_c_images | ||
| 6592 | void __ovld __conv intel_sub_group_block_write_us(write_only image2d_t image, int2 coord, ushort data); | ||
| 6593 | void __ovld __conv intel_sub_group_block_write_us2(write_only image2d_t image, int2 coord, ushort2 data); | ||
| 6594 | void __ovld __conv intel_sub_group_block_write_us4(write_only image2d_t image, int2 coord, ushort4 data); | ||
| 6595 | void __ovld __conv intel_sub_group_block_write_us8(write_only image2d_t image, int2 coord, ushort8 data); | ||
| 6596 | +#endif //__opencl_c_images | ||
| 6597 | |||
| 6598 | #if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6599 | +#ifdef __opencl_c_images | ||
| 6600 | +#ifdef __opencl_c_read_write_images | ||
| 6601 | void __ovld __conv intel_sub_group_block_write_us(read_write image2d_t image, int2 coord, ushort data); | ||
| 6602 | void __ovld __conv intel_sub_group_block_write_us2(read_write image2d_t image, int2 coord, ushort2 data); | ||
| 6603 | void __ovld __conv intel_sub_group_block_write_us4(read_write image2d_t image, int2 coord, ushort4 data); | ||
| 6604 | void __ovld __conv intel_sub_group_block_write_us8(read_write image2d_t image, int2 coord, ushort8 data); | ||
| 6605 | +#endif //__opencl_c_read_write_images | ||
| 6606 | +#endif //__opencl_c_images | ||
| 6607 | #endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 6608 | |||
| 6609 | void __ovld __conv intel_sub_group_block_write_us( __global ushort* p, ushort data ); | ||
| 6610 | @@ -16545,6 +18651,7 @@ short2 __ovld intel_sub_group_avc_ime_adjust_ref_offset( | ||
| 6611 | short2 ref_offset, ushort2 src_coord, ushort2 ref_window_size, | ||
| 6612 | ushort2 image_size); | ||
| 6613 | |||
| 6614 | +#ifdef __opencl_c_images | ||
| 6615 | intel_sub_group_avc_ime_result_t __ovld | ||
| 6616 | intel_sub_group_avc_ime_evaluate_with_single_reference( | ||
| 6617 | read_only image2d_t src_image, read_only image2d_t ref_image, | ||
| 6618 | @@ -16585,6 +18692,7 @@ intel_sub_group_avc_ime_evaluate_with_dual_reference_streaminout( | ||
| 6619 | read_only image2d_t bwd_ref_image, sampler_t vme_media_sampler, | ||
| 6620 | intel_sub_group_avc_ime_payload_t payload, | ||
| 6621 | intel_sub_group_avc_ime_dual_reference_streamin_t streamin_components); | ||
| 6622 | +#endif //__opencl_c_images | ||
| 6623 | |||
| 6624 | intel_sub_group_avc_ime_single_reference_streamin_t __ovld | ||
| 6625 | intel_sub_group_avc_ime_get_single_reference_streamin( | ||
| 6626 | @@ -16649,6 +18757,7 @@ intel_sub_group_avc_ref_payload_t __ovld | ||
| 6627 | intel_sub_group_avc_ref_set_bilinear_filter_enable( | ||
| 6628 | intel_sub_group_avc_ref_payload_t payload); | ||
| 6629 | |||
| 6630 | +#ifdef __opencl_c_images | ||
| 6631 | intel_sub_group_avc_ref_result_t __ovld | ||
| 6632 | intel_sub_group_avc_ref_evaluate_with_single_reference( | ||
| 6633 | read_only image2d_t src_image, read_only image2d_t ref_image, | ||
| 6634 | @@ -16667,6 +18776,7 @@ intel_sub_group_avc_ref_evaluate_with_multi_reference( | ||
| 6635 | read_only image2d_t src_image, uint packed_reference_ids, | ||
| 6636 | uchar packed_reference_field_polarities, sampler_t vme_media_sampler, | ||
| 6637 | intel_sub_group_avc_ref_payload_t payload); | ||
| 6638 | +#endif //__opencl_c_images | ||
| 6639 | |||
| 6640 | // SIC built-in functions | ||
| 6641 | intel_sub_group_avc_sic_payload_t __ovld | ||
| 6642 | @@ -16717,6 +18827,7 @@ intel_sub_group_avc_sic_set_block_based_raw_skip_sad( | ||
| 6643 | uchar block_based_skip_type, | ||
| 6644 | intel_sub_group_avc_sic_payload_t payload); | ||
| 6645 | |||
| 6646 | +#ifdef __opencl_c_images | ||
| 6647 | intel_sub_group_avc_sic_result_t __ovld | ||
| 6648 | intel_sub_group_avc_sic_evaluate_ipe( | ||
| 6649 | read_only image2d_t src_image, sampler_t vme_media_sampler, | ||
| 6650 | @@ -16739,6 +18850,7 @@ intel_sub_group_avc_sic_evaluate_with_multi_reference( | ||
| 6651 | read_only image2d_t src_image, uint packed_reference_ids, | ||
| 6652 | uchar packed_reference_field_polarities, sampler_t vme_media_sampler, | ||
| 6653 | intel_sub_group_avc_sic_payload_t payload); | ||
| 6654 | +#endif //__opencl_c_images | ||
| 6655 | |||
| 6656 | uchar __ovld intel_sub_group_avc_sic_get_ipe_luma_shape( | ||
| 6657 | intel_sub_group_avc_sic_result_t result); | ||
| 6658 | diff --git a/clang/lib/Parse/ParseDecl.cpp b/clang/lib/Parse/ParseDecl.cpp | ||
| 6659 | index c87d240a8206..8c8f03bba0f3 100644 | ||
| 6660 | --- a/clang/lib/Parse/ParseDecl.cpp | ||
| 6661 | +++ b/clang/lib/Parse/ParseDecl.cpp | ||
| 6662 | @@ -3799,8 +3799,7 @@ void Parser::ParseDeclarationSpecifiers(DeclSpec &DS, | ||
| 6663 | isInvalid = DS.SetTypeAltiVecBool(true, Loc, PrevSpec, DiagID, Policy); | ||
| 6664 | break; | ||
| 6665 | case tok::kw_pipe: | ||
| 6666 | - if (!getLangOpts().OpenCL || (getLangOpts().OpenCLVersion < 200 && | ||
| 6667 | - !getLangOpts().OpenCLCPlusPlus)) { | ||
| 6668 | + if (!getLangOpts().OpenCLPipeKeyword) { | ||
| 6669 | // OpenCL 2.0 defined this keyword. OpenCL 1.2 and earlier should | ||
| 6670 | // support the "pipe" word as identifier. | ||
| 6671 | Tok.getIdentifierInfo()->revertTokenIDToIdentifier(); | ||
| 6672 | @@ -3922,8 +3921,7 @@ void Parser::ParseDeclarationSpecifiers(DeclSpec &DS, | ||
| 6673 | case tok::kw___generic: | ||
| 6674 | // generic address space is introduced only in OpenCL v2.0 | ||
| 6675 | // see OpenCL C Spec v2.0 s6.5.5 | ||
| 6676 | - if (Actions.getLangOpts().OpenCLVersion < 200 && | ||
| 6677 | - !Actions.getLangOpts().OpenCLCPlusPlus) { | ||
| 6678 | + if (!Actions.getLangOpts().OpenCLGenericKeyword) { | ||
| 6679 | DiagID = diag::err_opencl_unknown_type_specifier; | ||
| 6680 | PrevSpec = Tok.getIdentifierInfo()->getNameStart(); | ||
| 6681 | isInvalid = true; | ||
| 6682 | @@ -4973,8 +4971,7 @@ bool Parser::isDeclarationSpecifier(bool DisambiguatingWithExpression) { | ||
| 6683 | default: return false; | ||
| 6684 | |||
| 6685 | case tok::kw_pipe: | ||
| 6686 | - return (getLangOpts().OpenCL && getLangOpts().OpenCLVersion >= 200) || | ||
| 6687 | - getLangOpts().OpenCLCPlusPlus; | ||
| 6688 | + return getLangOpts().OpenCLPipeKeyword; | ||
| 6689 | |||
| 6690 | case tok::identifier: // foo::bar | ||
| 6691 | // Unfortunate hack to support "Class.factoryMethod" notation. | ||
| 6692 | @@ -5499,8 +5496,7 @@ static bool isPtrOperatorToken(tok::TokenKind Kind, const LangOptions &Lang, | ||
| 6693 | if (Kind == tok::star || Kind == tok::caret) | ||
| 6694 | return true; | ||
| 6695 | |||
| 6696 | - if (Kind == tok::kw_pipe && | ||
| 6697 | - ((Lang.OpenCL && Lang.OpenCLVersion >= 200) || Lang.OpenCLCPlusPlus)) | ||
| 6698 | + if (Kind == tok::kw_pipe && Lang.OpenCLPipeKeyword) | ||
| 6699 | return true; | ||
| 6700 | |||
| 6701 | if (!Lang.CPlusPlus) | ||
| 6702 | diff --git a/clang/lib/Parse/ParsePragma.cpp b/clang/lib/Parse/ParsePragma.cpp | ||
| 6703 | index 6402b31d00b2..65f283ad556b 100644 | ||
| 6704 | --- a/clang/lib/Parse/ParsePragma.cpp | ||
| 6705 | +++ b/clang/lib/Parse/ParsePragma.cpp | ||
| 6706 | @@ -749,12 +749,14 @@ void Parser::HandlePragmaOpenCLExtension() { | ||
| 6707 | if (Name == "all") { | ||
| 6708 | if (State == Disable) { | ||
| 6709 | Opt.disableAll(); | ||
| 6710 | - Opt.enableSupportedCore(getLangOpts()); | ||
| 6711 | + Opt.enableSupportedCore(); | ||
| 6712 | } else { | ||
| 6713 | PP.Diag(NameLoc, diag::warn_pragma_expected_predicate) << 1; | ||
| 6714 | } | ||
| 6715 | + } else if (Opt.isFeature(Name)) { | ||
| 6716 | + PP.Diag(NameLoc, diag::warn_opencl_pragma_feature_ignore) << Ident; | ||
| 6717 | } else if (State == Begin) { | ||
| 6718 | - if (!Opt.isKnown(Name) || !Opt.isSupported(Name, getLangOpts())) { | ||
| 6719 | + if (!Opt.isKnown(Name) || !Opt.isSupported(Name)) { | ||
| 6720 | Opt.support(Name); | ||
| 6721 | } | ||
| 6722 | Actions.setCurrentOpenCLExtension(Name); | ||
| 6723 | @@ -764,9 +766,9 @@ void Parser::HandlePragmaOpenCLExtension() { | ||
| 6724 | Actions.setCurrentOpenCLExtension(""); | ||
| 6725 | } else if (!Opt.isKnown(Name)) | ||
| 6726 | PP.Diag(NameLoc, diag::warn_pragma_unknown_extension) << Ident; | ||
| 6727 | - else if (Opt.isSupportedExtension(Name, getLangOpts())) | ||
| 6728 | + else if (Opt.isSupportedExtension(Name)) | ||
| 6729 | Opt.enable(Name, State == Enable); | ||
| 6730 | - else if (Opt.isSupportedCore(Name, getLangOpts())) | ||
| 6731 | + else if (Opt.isSupportedCore(Name)) | ||
| 6732 | PP.Diag(NameLoc, diag::warn_pragma_extension_is_core) << Ident; | ||
| 6733 | else | ||
| 6734 | PP.Diag(NameLoc, diag::warn_pragma_unsupported_extension) << Ident; | ||
| 6735 | diff --git a/clang/lib/Sema/OpenCLBuiltins.td b/clang/lib/Sema/OpenCLBuiltins.td | ||
| 6736 | index 745363a6b43f..6a1fce567090 100644 | ||
| 6737 | --- a/clang/lib/Sema/OpenCLBuiltins.td | ||
| 6738 | +++ b/clang/lib/Sema/OpenCLBuiltins.td | ||
| 6739 | @@ -22,11 +22,13 @@ | ||
| 6740 | class Version<int _Version> { | ||
| 6741 | int ID = _Version; | ||
| 6742 | } | ||
| 6743 | + | ||
| 6744 | def CLAll : Version< 0>; | ||
| 6745 | def CL10 : Version<100>; | ||
| 6746 | def CL11 : Version<110>; | ||
| 6747 | def CL12 : Version<120>; | ||
| 6748 | def CL20 : Version<200>; | ||
| 6749 | +def CL30 : Version<300>; | ||
| 6750 | |||
| 6751 | // Address spaces | ||
| 6752 | // Pointer types need to be assigned an address space. | ||
| 6753 | @@ -72,6 +74,14 @@ def ArmIntegerDotProductAccumulateInt8 : FunctionExtension<"cl_arm_integ | ||
| 6754 | def ArmIntegerDotProductAccumulateInt16 : FunctionExtension<"cl_arm_integer_dot_product_accumulate_int16">; | ||
| 6755 | def ArmIntegerDotProductAccumulateSaturateInt8 : FunctionExtension<"cl_arm_integer_dot_product_accumulate_saturate_int8">; | ||
| 6756 | |||
| 6757 | +// Features | ||
| 6758 | +def FuncExtGenericAddressSpace : FunctionExtension<"__opencl_c_generic_address_space">; | ||
| 6759 | +def FuncExtWorkGroupCollective : FunctionExtension<"__opencl_c_work_group_collective_functions">; | ||
| 6760 | +def FuncExtPipes : FunctionExtension<"__opencl_c_pipes">; | ||
| 6761 | +def FuncExtDeviceSidEenqueue : FunctionExtension<"__opencl_c_device_enqueue">; | ||
| 6762 | +def FuncNonExplicitAtomicFeatures : FunctionExtension<"__opencl_c_atomic_order_seq_cst __opencl_c_atomic_scope_device">; | ||
| 6763 | +def FuncNonExplicitAtomicFeaturesAndGenericAS : FunctionExtension<"__opencl_c_atomic_order_seq_cst __opencl_c_atomic_scope_device __opencl_c_generic_address_space">; | ||
| 6764 | + | ||
| 6765 | // Qualified Type. These map to ASTContext::QualType. | ||
| 6766 | class QualType<string _Name, bit _IsAbstract=0> { | ||
| 6767 | // Name of the field or function in a clang::ASTContext | ||
| 6768 | @@ -236,13 +246,9 @@ class Builtin<string _Name, list<Type> _Signature, list<bit> _Attributes = Attr. | ||
| 6769 | bit IsConv = _Attributes[2]; | ||
| 6770 | // OpenCL extensions to which the function belongs. | ||
| 6771 | FunctionExtension Extension = FuncExtNone; | ||
| 6772 | - // Version of OpenCL from which the function is available (e.g.: CL10). | ||
| 6773 | - // MinVersion is inclusive. | ||
| 6774 | - Version MinVersion = CL10; | ||
| 6775 | - // Version of OpenCL from which the function is not supported anymore. | ||
| 6776 | - // MaxVersion is exclusive. | ||
| 6777 | + // List of OpenCL version in which this function available. | ||
| 6778 | // CLAll makes the function available for all versions. | ||
| 6779 | - Version MaxVersion = CLAll; | ||
| 6780 | + list<Version> Versions = [CLAll]; | ||
| 6781 | } | ||
| 6782 | |||
| 6783 | //===----------------------------------------------------------------------===// | ||
| 6784 | @@ -421,7 +427,7 @@ foreach name = ["get_global_size", "get_global_id", "get_local_size", | ||
| 6785 | def : Builtin<name, [Size, UInt], Attr.Const>; | ||
| 6786 | } | ||
| 6787 | |||
| 6788 | -let MinVersion = CL20 in { | ||
| 6789 | +let Versions = [CL20, CL30] in { | ||
| 6790 | def : Builtin<"get_enqueued_local_size", [Size, UInt]>; | ||
| 6791 | foreach name = ["get_global_linear_id", "get_local_linear_id"] in { | ||
| 6792 | def : Builtin<name, [Size]>; | ||
| 6793 | @@ -494,7 +500,7 @@ foreach name = ["fma", "mad"] in { | ||
| 6794 | } | ||
| 6795 | |||
| 6796 | // --- Version dependent --- | ||
| 6797 | -let MaxVersion = CL20 in { | ||
| 6798 | +let Versions = [CL10, CL11, CL12, CL30] in { | ||
| 6799 | foreach AS = [GlobalAS, LocalAS, PrivateAS] in { | ||
| 6800 | foreach name = ["fract", "modf", "sincos"] in { | ||
| 6801 | def : Builtin<name, [FGenTypeN, FGenTypeN, PointerType<FGenTypeN, AS>]>; | ||
| 6802 | @@ -511,7 +517,9 @@ let MaxVersion = CL20 in { | ||
| 6803 | } | ||
| 6804 | } | ||
| 6805 | } | ||
| 6806 | -let MinVersion = CL20 in { | ||
| 6807 | + | ||
| 6808 | +let Versions = [CL20, CL30] in { | ||
| 6809 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6810 | foreach name = ["fract", "modf", "sincos"] in { | ||
| 6811 | def : Builtin<name, [FGenTypeN, FGenTypeN, PointerType<FGenTypeN, GenericAS>]>; | ||
| 6812 | } | ||
| 6813 | @@ -524,6 +532,7 @@ let MinVersion = CL20 in { | ||
| 6814 | def : Builtin<name, [Type, Type, Type, PointerType<GenTypeIntVecAndScalar, GenericAS>]>; | ||
| 6815 | } | ||
| 6816 | } | ||
| 6817 | + } | ||
| 6818 | } | ||
| 6819 | |||
| 6820 | // --- Table 9 --- | ||
| 6821 | @@ -554,7 +563,7 @@ foreach name = ["abs"] in { | ||
| 6822 | foreach name = ["clz", "popcount"] in { | ||
| 6823 | def : Builtin<name, [AIGenTypeN, AIGenTypeN], Attr.Const>; | ||
| 6824 | } | ||
| 6825 | -let MinVersion = CL20 in { | ||
| 6826 | +let Versions = [CL20, CL30] in { | ||
| 6827 | foreach name = ["ctz"] in { | ||
| 6828 | def : Builtin<name, [AIGenTypeN, AIGenTypeN]>; | ||
| 6829 | } | ||
| 6830 | @@ -728,7 +737,7 @@ foreach name = ["select"] in { | ||
| 6831 | // --- Table 15 --- | ||
| 6832 | // Variants for OpenCL versions below 2.0, using pointers to the global, local | ||
| 6833 | // and private address spaces. | ||
| 6834 | -let MaxVersion = CL20 in { | ||
| 6835 | +let Versions = [CL10, CL11, CL12, CL30] in { | ||
| 6836 | foreach AS = [GlobalAS, LocalAS, PrivateAS] in { | ||
| 6837 | foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6838 | foreach name = ["vload" # VSize] in { | ||
| 6839 | @@ -771,7 +780,8 @@ let MaxVersion = CL20 in { | ||
| 6840 | } | ||
| 6841 | // Variants for OpenCL versions above 2.0, using pointers to the generic | ||
| 6842 | // address space. | ||
| 6843 | -let MinVersion = CL20 in { | ||
| 6844 | +let Versions = [CL20, CL30] in { | ||
| 6845 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6846 | foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6847 | foreach name = ["vload" # VSize] in { | ||
| 6848 | def : Builtin<name, [VectorType<Char, VSize>, Size, PointerType<ConstType<Char>, GenericAS>]>; | ||
| 6849 | @@ -809,6 +819,7 @@ let MinVersion = CL20 in { | ||
| 6850 | } | ||
| 6851 | } | ||
| 6852 | } | ||
| 6853 | + } | ||
| 6854 | } | ||
| 6855 | // Variants using pointers to the constant address space. | ||
| 6856 | foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6857 | @@ -829,7 +840,7 @@ foreach VSize = [2, 3, 4, 8, 16] in { | ||
| 6858 | def : Builtin<name, [VectorType<Float, VSize>, Size, PointerType<ConstType<Half>, ConstantAS>]>; | ||
| 6859 | } | ||
| 6860 | } | ||
| 6861 | -let MaxVersion = CL20 in { | ||
| 6862 | +let Versions = [CL10, CL11, CL12, CL30] in { | ||
| 6863 | foreach AS = [GlobalAS, LocalAS, PrivateAS] in { | ||
| 6864 | def : Builtin<"vload_half", [Float, Size, PointerType<ConstType<Half>, AS>]>; | ||
| 6865 | def : Builtin<"vloada_half", [Float, Size, PointerType<ConstType<Half>, AS>]>; | ||
| 6866 | @@ -852,7 +863,8 @@ let MaxVersion = CL20 in { | ||
| 6867 | } | ||
| 6868 | } | ||
| 6869 | } | ||
| 6870 | -let MinVersion = CL20 in { | ||
| 6871 | +let Versions = [CL20, CL30] in { | ||
| 6872 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6873 | foreach AS = [GenericAS] in { | ||
| 6874 | def : Builtin<"vload_half", [Float, Size, PointerType<ConstType<Half>, AS>]>; | ||
| 6875 | def : Builtin<"vloada_half", [Float, Size, PointerType<ConstType<Half>, AS>]>; | ||
| 6876 | @@ -874,6 +886,7 @@ let MinVersion = CL20 in { | ||
| 6877 | } | ||
| 6878 | } | ||
| 6879 | } | ||
| 6880 | + } | ||
| 6881 | } | ||
| 6882 | |||
| 6883 | foreach AS = [ConstantAS] in { | ||
| 6884 | @@ -899,7 +912,9 @@ foreach name = ["async_work_group_strided_copy"] in { | ||
| 6885 | def : Builtin<name, [Event, PointerType<AGenTypeN, GlobalAS>, PointerType<ConstType<AGenTypeN>, LocalAS>, Size, Size, Event]>; | ||
| 6886 | } | ||
| 6887 | foreach name = ["wait_group_events"] in { | ||
| 6888 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6889 | def : Builtin<name, [Void, Int, PointerType<Event, GenericAS>]>; | ||
| 6890 | + } | ||
| 6891 | } | ||
| 6892 | foreach name = ["prefetch"] in { | ||
| 6893 | def : Builtin<name, [Void, PointerType<ConstType<AGenTypeN>, GlobalAS>, Size]>; | ||
| 6894 | @@ -1000,13 +1015,25 @@ foreach AS = [GlobalAS, LocalAS] in { | ||
| 6895 | } | ||
| 6896 | } | ||
| 6897 | } | ||
| 6898 | + | ||
| 6899 | // OpenCL v2.0 s6.13.11 - Atomic Functions. | ||
| 6900 | -let MinVersion = CL20 in { | ||
| 6901 | + | ||
| 6902 | +let Versions = [CL20, CL30] in { | ||
| 6903 | + let Extension = FuncExtGenericAddressSpace in { | ||
| 6904 | + foreach TypePair = [[AtomicInt, Int], [AtomicUInt, UInt], | ||
| 6905 | + [AtomicLong, Long], [AtomicULong, ULong], | ||
| 6906 | + [AtomicFloat, Float], [AtomicDouble, Double]] in { | ||
| 6907 | + def : Builtin<"atomic_init", | ||
| 6908 | + [Void, PointerType<VolatileType<TypePair[0]>, GenericAS>, TypePair[1]]>; | ||
| 6909 | + } | ||
| 6910 | + } | ||
| 6911 | +} | ||
| 6912 | + | ||
| 6913 | +let Versions = [CL20, CL30] in { | ||
| 6914 | + let Extension = FuncNonExplicitAtomicFeaturesAndGenericAS in { | ||
| 6915 | foreach TypePair = [[AtomicInt, Int], [AtomicUInt, UInt], | ||
| 6916 | [AtomicLong, Long], [AtomicULong, ULong], | ||
| 6917 | [AtomicFloat, Float], [AtomicDouble, Double]] in { | ||
| 6918 | - def : Builtin<"atomic_init", | ||
| 6919 | - [Void, PointerType<VolatileType<TypePair[0]>, GenericAS>, TypePair[1]]>; | ||
| 6920 | def : Builtin<"atomic_store", | ||
| 6921 | [Void, PointerType<VolatileType<TypePair[0]>, GenericAS>, TypePair[1]]>; | ||
| 6922 | def : Builtin<"atomic_load", | ||
| 6923 | @@ -1038,6 +1065,59 @@ let MinVersion = CL20 in { | ||
| 6924 | [TypePair[1], PointerType<VolatileType<TypePair[0]>, GenericAS>, TypePair[2]]>; | ||
| 6925 | } | ||
| 6926 | } | ||
| 6927 | + } | ||
| 6928 | +} | ||
| 6929 | + | ||
| 6930 | +let Versions = [CL30] in { | ||
| 6931 | + foreach AS = [GlobalAS, LocalAS] in { | ||
| 6932 | + foreach TypePair = [[AtomicInt, Int], [AtomicUInt, UInt], | ||
| 6933 | + [AtomicLong, Long], [AtomicULong, ULong], | ||
| 6934 | + [AtomicFloat, Float], [AtomicDouble, Double]] in { | ||
| 6935 | + def : Builtin<"atomic_init", | ||
| 6936 | + [Void, PointerType<VolatileType<TypePair[0]>, AS>, TypePair[1]]>; | ||
| 6937 | + } | ||
| 6938 | + } | ||
| 6939 | +} | ||
| 6940 | + | ||
| 6941 | +let Versions = [CL30] in { | ||
| 6942 | + let Extension = FuncNonExplicitAtomicFeatures in { | ||
| 6943 | + foreach AS = [GlobalAS, LocalAS] in { | ||
| 6944 | + foreach TypePair = [[AtomicInt, Int], [AtomicUInt, UInt], | ||
| 6945 | + [AtomicLong, Long], [AtomicULong, ULong], | ||
| 6946 | + [AtomicFloat, Float], [AtomicDouble, Double]] in { | ||
| 6947 | + def : Builtin<"atomic_store", | ||
| 6948 | + [Void, PointerType<VolatileType<TypePair[0]>, AS>, TypePair[1]]>; | ||
| 6949 | + def : Builtin<"atomic_load", | ||
| 6950 | + [TypePair[1], PointerType<VolatileType<TypePair[0]>, AS>]>; | ||
| 6951 | + def : Builtin<"atomic_exchange", | ||
| 6952 | + [TypePair[1], PointerType<VolatileType<TypePair[0]>, AS>, TypePair[1]]>; | ||
| 6953 | + foreach Variant = ["weak", "strong"] in { | ||
| 6954 | + def : Builtin<"atomic_compare_exchange_" # Variant, | ||
| 6955 | + [Bool, PointerType<VolatileType<TypePair[0]>, AS>, | ||
| 6956 | + PointerType<TypePair[1], AS>, TypePair[1]]>; | ||
| 6957 | + } | ||
| 6958 | + } | ||
| 6959 | + | ||
| 6960 | + foreach TypePair = [[AtomicInt, Int, Int], [AtomicUInt, UInt, UInt], | ||
| 6961 | + [AtomicLong, Long, Long], [AtomicULong, ULong, ULong], | ||
| 6962 | + [AtomicIntPtr, IntPtr, PtrDiff], | ||
| 6963 | + [AtomicUIntPtr, UIntPtr, PtrDiff]] in { | ||
| 6964 | + foreach ModOp = ["add", "sub"] in { | ||
| 6965 | + def : Builtin<"atomic_fetch_" # ModOp, | ||
| 6966 | + [TypePair[1], PointerType<VolatileType<TypePair[0]>, AS>, TypePair[2]]>; | ||
| 6967 | + } | ||
| 6968 | + } | ||
| 6969 | + foreach TypePair = [[AtomicInt, Int, Int], [AtomicUInt, UInt, UInt], | ||
| 6970 | + [AtomicLong, Long, Long], [AtomicULong, ULong, ULong], | ||
| 6971 | + [AtomicIntPtr, IntPtr, IntPtr], | ||
| 6972 | + [AtomicUIntPtr, UIntPtr, UIntPtr]] in { | ||
| 6973 | + foreach ModOp = ["or", "xor", "and", "min", "max"] in { | ||
| 6974 | + def : Builtin<"atomic_fetch_" # ModOp, | ||
| 6975 | + [TypePair[1], PointerType<VolatileType<TypePair[0]>, AS>, TypePair[2]]>; | ||
| 6976 | + } | ||
| 6977 | + } | ||
| 6978 | + } | ||
| 6979 | + } | ||
| 6980 | } | ||
| 6981 | |||
| 6982 | //-------------------------------------------------------------------- | ||
| 6983 | @@ -1217,7 +1297,8 @@ foreach aQual = ["WO", "RW"] in { | ||
| 6984 | //-------------------------------------------------------------------- | ||
| 6985 | // OpenCL v2.0 s6.13.15 - Work-group Functions | ||
| 6986 | // --- Table 26 --- | ||
| 6987 | -let MinVersion = CL20 in { | ||
| 6988 | +let Versions = [CL20, CL30] in { | ||
| 6989 | + let Extension = FuncExtWorkGroupCollective in { | ||
| 6990 | foreach name = ["work_group_all", "work_group_any"] in { | ||
| 6991 | def : Builtin<name, [Int, Int], Attr.Convergent>; | ||
| 6992 | } | ||
| 6993 | @@ -1232,6 +1313,7 @@ let MinVersion = CL20 in { | ||
| 6994 | def : Builtin<name # op, [IntLongFloatGenType1, IntLongFloatGenType1], Attr.Convergent>; | ||
| 6995 | } | ||
| 6996 | } | ||
| 6997 | + } | ||
| 6998 | } | ||
| 6999 | |||
| 7000 | |||
| 7001 | @@ -1241,8 +1323,10 @@ let MinVersion = CL20 in { | ||
| 7002 | // Defined in Builtins.def | ||
| 7003 | |||
| 7004 | // --- Table 28 --- | ||
| 7005 | -// Builtins taking pipe arguments are defined in Builtins.def | ||
| 7006 | -def : Builtin<"is_valid_reserve_id", [Bool, ReserveId]>; | ||
| 7007 | +let Extension = FuncExtPipes in { | ||
| 7008 | + // Builtins taking pipe arguments are defined in Builtins.def | ||
| 7009 | + def : Builtin<"is_valid_reserve_id", [Bool, ReserveId]>; | ||
| 7010 | +} | ||
| 7011 | |||
| 7012 | // --- Table 29 --- | ||
| 7013 | // Defined in Builtins.def | ||
| 7014 | @@ -1257,21 +1341,22 @@ def : Builtin<"is_valid_reserve_id", [Bool, ReserveId]>; | ||
| 7015 | // Defined in Builtins.def | ||
| 7016 | |||
| 7017 | // --- Table 33 --- | ||
| 7018 | -def : Builtin<"enqueue_marker", | ||
| 7019 | - [Int, Queue, UInt, PointerType<ConstType<ClkEvent>, GenericAS>, PointerType<ClkEvent, GenericAS>]>; | ||
| 7020 | +let Extension = FuncExtDeviceSidEenqueue in { | ||
| 7021 | + def : Builtin<"enqueue_marker", | ||
| 7022 | + [Int, Queue, UInt, PointerType<ConstType<ClkEvent>, GenericAS>, PointerType<ClkEvent, GenericAS>]>; | ||
| 7023 | |||
| 7024 | -// --- Table 34 --- | ||
| 7025 | -def : Builtin<"retain_event", [Void, ClkEvent]>; | ||
| 7026 | -def : Builtin<"release_event", [Void, ClkEvent]>; | ||
| 7027 | -def : Builtin<"create_user_event", [ClkEvent]>; | ||
| 7028 | -def : Builtin<"is_valid_event", [Bool, ClkEvent]>; | ||
| 7029 | -def : Builtin<"set_user_event_status", [Void, ClkEvent, Int]>; | ||
| 7030 | -// TODO: capture_event_profiling_info | ||
| 7031 | - | ||
| 7032 | -// --- Table 35 --- | ||
| 7033 | -def : Builtin<"get_default_queue", [Queue]>; | ||
| 7034 | -// TODO: ndrange functions | ||
| 7035 | + // --- Table 34 --- | ||
| 7036 | + def : Builtin<"retain_event", [Void, ClkEvent]>; | ||
| 7037 | + def : Builtin<"release_event", [Void, ClkEvent]>; | ||
| 7038 | + def : Builtin<"create_user_event", [ClkEvent]>; | ||
| 7039 | + def : Builtin<"is_valid_event", [Bool, ClkEvent]>; | ||
| 7040 | + def : Builtin<"set_user_event_status", [Void, ClkEvent, Int]>; | ||
| 7041 | + // TODO: capture_event_profiling_info | ||
| 7042 | |||
| 7043 | + // --- Table 35 --- | ||
| 7044 | + def : Builtin<"get_default_queue", [Queue]>; | ||
| 7045 | + // TODO: ndrange functions | ||
| 7046 | +} | ||
| 7047 | |||
| 7048 | //-------------------------------------------------------------------- | ||
| 7049 | // End of the builtin functions defined in the OpenCL C specification. | ||
| 7050 | @@ -1456,7 +1541,7 @@ let Extension = FuncExtKhrSubgroups in { | ||
| 7051 | "get_sub_group_local_id"] in { | ||
| 7052 | def : Builtin<name, [UInt]>; | ||
| 7053 | } | ||
| 7054 | - let MinVersion = CL20 in { | ||
| 7055 | + let Versions = [CL20] in { | ||
| 7056 | foreach name = ["get_enqueued_num_sub_groups"] in { | ||
| 7057 | def : Builtin<name, [UInt]>; | ||
| 7058 | } | ||
| 7059 | diff --git a/clang/lib/Sema/Sema.cpp b/clang/lib/Sema/Sema.cpp | ||
| 7060 | index 2f2b52106f3d..5092a4691b9b 100644 | ||
| 7061 | --- a/clang/lib/Sema/Sema.cpp | ||
| 7062 | +++ b/clang/lib/Sema/Sema.cpp | ||
| 7063 | @@ -291,9 +291,10 @@ void Sema::Initialize() { | ||
| 7064 | // Initialize predefined OpenCL types and supported extensions and (optional) | ||
| 7065 | // core features. | ||
| 7066 | if (getLangOpts().OpenCL) { | ||
| 7067 | + getOpenCLOptions().setOpenCLVersion(getLangOpts()); | ||
| 7068 | getOpenCLOptions().addSupport( | ||
| 7069 | Context.getTargetInfo().getSupportedOpenCLOpts()); | ||
| 7070 | - getOpenCLOptions().enableSupportedCore(getLangOpts()); | ||
| 7071 | + getOpenCLOptions().enableSupportedCore(); | ||
| 7072 | addImplicitTypedef("sampler_t", Context.OCLSamplerTy); | ||
| 7073 | addImplicitTypedef("event_t", Context.OCLEventTy); | ||
| 7074 | if (getLangOpts().OpenCLCPlusPlus || getLangOpts().OpenCLVersion >= 200) { | ||
| 7075 | @@ -349,12 +350,18 @@ void Sema::Initialize() { | ||
| 7076 | "cl_khr_int64_base_atomics cl_khr_int64_extended_atomics"); | ||
| 7077 | |||
| 7078 | setOpenCLExtensionForType(AtomicDoubleT, "cl_khr_fp64"); | ||
| 7079 | + setOpenCLExtensionForType(Context.OCLReserveIDTy, "__opencl_c_pipes"); | ||
| 7080 | + setOpenCLExtensionForType(Context.OCLClkEventTy, | ||
| 7081 | + "__opencl_c_device_enqueue"); | ||
| 7082 | + setOpenCLExtensionForType(Context.OCLQueueTy, | ||
| 7083 | + "__opencl_c_device_enqueue"); | ||
| 7084 | } | ||
| 7085 | |||
| 7086 | setOpenCLExtensionForType(Context.DoubleTy, "cl_khr_fp64"); | ||
| 7087 | |||
| 7088 | -#define GENERIC_IMAGE_TYPE_EXT(Type, Id, Ext) \ | ||
| 7089 | - setOpenCLExtensionForType(Context.Id, Ext); | ||
| 7090 | +#define GENERIC_IMAGE_TYPE_EXT(Type, Id, Ext) \ | ||
| 7091 | + setOpenCLExtensionForType(Context.Id, Ext); \ | ||
| 7092 | + setOpenCLExtensionForType(Context.Id, "__opencl_c_images"); | ||
| 7093 | #include "clang/Basic/OpenCLImageTypes.def" | ||
| 7094 | #define EXT_OPAQUE_TYPE(ExtType, Id, Ext) \ | ||
| 7095 | addImplicitTypedef(#ExtType, Context.Id##Ty); \ | ||
| 7096 | @@ -2423,6 +2430,27 @@ bool Sema::isOpenCLDisabledDecl(Decl *FD) { | ||
| 7097 | return false; | ||
| 7098 | } | ||
| 7099 | |||
| 7100 | +template <typename DiagLocT, typename DiagInfoT> | ||
| 7101 | +void Sema::DiagnoseOpenCLRequiresOption(llvm::StringRef OpenCLOptName, | ||
| 7102 | + DiagLocT DiagLoc, DiagInfoT DiagInfo, | ||
| 7103 | + unsigned Selector, | ||
| 7104 | + SourceRange SrcRange) { | ||
| 7105 | + const auto &LO = getLangOpts(); | ||
| 7106 | + auto CLVer = LO.OpenCLCPlusPlus ? 200 : LO.OpenCLVersion; | ||
| 7107 | + // For versions higher that 3.0 diagnosing feature | ||
| 7108 | + if (CLVer >= 300) { | ||
| 7109 | + OpenCLOptName = | ||
| 7110 | + llvm::StringSwitch<llvm::StringRef>(OpenCLOptName) | ||
| 7111 | + .Case("cl_khr_3d_image_writes", "__opencl_c_3d_image_writes") | ||
| 7112 | + .Case("cl_khr_subgroups", "__opencl_c_subgroups") | ||
| 7113 | + .Case("cl_khr_fp64", "__opencl_c_fp64") | ||
| 7114 | + .Default(OpenCLOptName); | ||
| 7115 | + } | ||
| 7116 | + | ||
| 7117 | + Diag(DiagLoc, diag::err_opencl_requires_extension) | ||
| 7118 | + << Selector << DiagInfo << OpenCLOptName << SrcRange; | ||
| 7119 | +} | ||
| 7120 | + | ||
| 7121 | template <typename T, typename DiagLocT, typename DiagInfoT, typename MapT> | ||
| 7122 | bool Sema::checkOpenCLDisabledTypeOrDecl(T D, DiagLocT DiagLoc, | ||
| 7123 | DiagInfoT DiagInfo, MapT &Map, | ||
| 7124 | @@ -2434,8 +2462,7 @@ bool Sema::checkOpenCLDisabledTypeOrDecl(T D, DiagLocT DiagLoc, | ||
| 7125 | bool Disabled = false; | ||
| 7126 | for (auto &I : Loc->second) { | ||
| 7127 | if (I != CurrOpenCLExtension && !getOpenCLOptions().isEnabled(I)) { | ||
| 7128 | - Diag(DiagLoc, diag::err_opencl_requires_extension) << Selector << DiagInfo | ||
| 7129 | - << I << SrcRange; | ||
| 7130 | + DiagnoseOpenCLRequiresOption(I, DiagLoc, DiagInfo, Selector, SrcRange); | ||
| 7131 | Disabled = true; | ||
| 7132 | } | ||
| 7133 | } | ||
| 7134 | @@ -2471,3 +2498,13 @@ bool Sema::checkOpenCLDisabledDecl(const NamedDecl &D, const Expr &E) { | ||
| 7135 | return checkOpenCLDisabledTypeOrDecl(&D, E.getBeginLoc(), FnName, | ||
| 7136 | OpenCLDeclExtMap, 1, D.getSourceRange()); | ||
| 7137 | } | ||
| 7138 | + | ||
| 7139 | +bool Sema::checkOpenCLSubgroupExtForCallExpr(CallExpr *Call) { | ||
| 7140 | + if (!getOpenCLOptions().isEnabled("cl_khr_subgroups")) { | ||
| 7141 | + DiagnoseOpenCLRequiresOption("cl_khr_subgroups", Call->getBeginLoc(), | ||
| 7142 | + Call->getDirectCallee(), 1, | ||
| 7143 | + Call->getSourceRange()); | ||
| 7144 | + return true; | ||
| 7145 | + } | ||
| 7146 | + return false; | ||
| 7147 | +} | ||
| 7148 | diff --git a/clang/lib/Sema/SemaChecking.cpp b/clang/lib/Sema/SemaChecking.cpp | ||
| 7149 | index 1bf04d9cb4f2..9dd63db0f420 100644 | ||
| 7150 | --- a/clang/lib/Sema/SemaChecking.cpp | ||
| 7151 | +++ b/clang/lib/Sema/SemaChecking.cpp | ||
| 7152 | @@ -835,20 +835,11 @@ static bool checkOpenCLBlockArgs(Sema &S, Expr *BlockArg) { | ||
| 7153 | return IllegalParams; | ||
| 7154 | } | ||
| 7155 | |||
| 7156 | -static bool checkOpenCLSubgroupExt(Sema &S, CallExpr *Call) { | ||
| 7157 | - if (!S.getOpenCLOptions().isEnabled("cl_khr_subgroups")) { | ||
| 7158 | - S.Diag(Call->getBeginLoc(), diag::err_opencl_requires_extension) | ||
| 7159 | - << 1 << Call->getDirectCallee() << "cl_khr_subgroups"; | ||
| 7160 | - return true; | ||
| 7161 | - } | ||
| 7162 | - return false; | ||
| 7163 | -} | ||
| 7164 | - | ||
| 7165 | static bool SemaOpenCLBuiltinNDRangeAndBlock(Sema &S, CallExpr *TheCall) { | ||
| 7166 | if (checkArgCount(S, TheCall, 2)) | ||
| 7167 | return true; | ||
| 7168 | |||
| 7169 | - if (checkOpenCLSubgroupExt(S, TheCall)) | ||
| 7170 | + if (S.checkOpenCLSubgroupExtForCallExpr(TheCall)) | ||
| 7171 | return true; | ||
| 7172 | |||
| 7173 | // First argument is an ndrange_t type. | ||
| 7174 | @@ -1883,7 +1874,7 @@ Sema::CheckBuiltinFunctionCall(FunctionDecl *FDecl, unsigned BuiltinID, | ||
| 7175 | break; | ||
| 7176 | case Builtin::BIsub_group_reserve_read_pipe: | ||
| 7177 | case Builtin::BIsub_group_reserve_write_pipe: | ||
| 7178 | - if (checkOpenCLSubgroupExt(*this, TheCall) || | ||
| 7179 | + if (checkOpenCLSubgroupExtForCallExpr(TheCall) || | ||
| 7180 | SemaBuiltinReserveRWPipe(*this, TheCall)) | ||
| 7181 | return ExprError(); | ||
| 7182 | break; | ||
| 7183 | @@ -1896,7 +1887,7 @@ Sema::CheckBuiltinFunctionCall(FunctionDecl *FDecl, unsigned BuiltinID, | ||
| 7184 | break; | ||
| 7185 | case Builtin::BIsub_group_commit_read_pipe: | ||
| 7186 | case Builtin::BIsub_group_commit_write_pipe: | ||
| 7187 | - if (checkOpenCLSubgroupExt(*this, TheCall) || | ||
| 7188 | + if (checkOpenCLSubgroupExtForCallExpr(TheCall) || | ||
| 7189 | SemaBuiltinCommitRWPipe(*this, TheCall)) | ||
| 7190 | return ExprError(); | ||
| 7191 | break; | ||
| 7192 | @@ -4149,6 +4140,20 @@ DiagnoseCStringFormatDirectiveInCFAPI(Sema &S, | ||
| 7193 | } | ||
| 7194 | } | ||
| 7195 | |||
| 7196 | +bool Sema::isSupportedOpenCLOMemoryOrdering(int64_t Ordering) const { | ||
| 7197 | + assert(llvm::isValidAtomicOrderingCABI(Ordering)); | ||
| 7198 | + auto OrderingCABI = (llvm::AtomicOrderingCABI)Ordering; | ||
| 7199 | + switch (OrderingCABI) { | ||
| 7200 | + case llvm::AtomicOrderingCABI::acquire: | ||
| 7201 | + case llvm::AtomicOrderingCABI::release: | ||
| 7202 | + case llvm::AtomicOrderingCABI::acq_rel: | ||
| 7203 | + return OpenCLFeatures.isEnabled("__opencl_c_atomic_order_acq_rel"); | ||
| 7204 | + | ||
| 7205 | + default: | ||
| 7206 | + return true; | ||
| 7207 | + } | ||
| 7208 | +} | ||
| 7209 | + | ||
| 7210 | /// Determine whether the given type has a non-null nullability annotation. | ||
| 7211 | static bool isNonNullType(ASTContext &ctx, QualType type) { | ||
| 7212 | if (auto nullability = type->getNullability(ctx)) | ||
| 7213 | @@ -4920,10 +4925,17 @@ ExprResult Sema::BuildAtomicExpr(SourceRange CallRange, SourceRange ExprRange, | ||
| 7214 | if (SubExprs.size() >= 2 && Form != Init) { | ||
| 7215 | llvm::APSInt Result(32); | ||
| 7216 | if (SubExprs[1]->isIntegerConstantExpr(Result, Context) && | ||
| 7217 | - !isValidOrderingForOp(Result.getSExtValue(), Op)) | ||
| 7218 | + !isValidOrderingForOp(Result.getSExtValue(), Op)) { | ||
| 7219 | Diag(SubExprs[1]->getBeginLoc(), | ||
| 7220 | diag::warn_atomic_op_has_invalid_memory_order) | ||
| 7221 | << SubExprs[1]->getSourceRange(); | ||
| 7222 | + } else if (IsOpenCL && | ||
| 7223 | + !isSupportedOpenCLOMemoryOrdering(Result.getSExtValue())) { | ||
| 7224 | + Diag(SubExprs[1]->getBeginLoc(), | ||
| 7225 | + diag::err_opencl_memory_ordering_require_feat) | ||
| 7226 | + << SubExprs[1]->getSourceRange(); | ||
| 7227 | + return ExprError(); | ||
| 7228 | + } | ||
| 7229 | } | ||
| 7230 | |||
| 7231 | if (auto ScopeModel = AtomicExpr::getScopeModel(Op)) { | ||
| 7232 | diff --git a/clang/lib/Sema/SemaDecl.cpp b/clang/lib/Sema/SemaDecl.cpp | ||
| 7233 | index 5b0417fa8859..2dee60763d57 100644 | ||
| 7234 | --- a/clang/lib/Sema/SemaDecl.cpp | ||
| 7235 | +++ b/clang/lib/Sema/SemaDecl.cpp | ||
| 7236 | @@ -6290,7 +6290,9 @@ void Sema::deduceOpenCLAddressSpace(ValueDecl *Decl) { | ||
| 7237 | if (Type->isSamplerT() || Type->isVoidType()) | ||
| 7238 | return; | ||
| 7239 | LangAS ImplAS = LangAS::opencl_private; | ||
| 7240 | - if ((getLangOpts().OpenCLCPlusPlus || getLangOpts().OpenCLVersion >= 200) && | ||
| 7241 | + if ((getLangOpts().OpenCLCPlusPlus || | ||
| 7242 | + getOpenCLOptions().isEnabled( | ||
| 7243 | + "__opencl_c_program_scope_global_variables")) && | ||
| 7244 | Var->hasGlobalStorage()) | ||
| 7245 | ImplAS = LangAS::opencl_global; | ||
| 7246 | // If the original type from a decayed type is an array type and that array | ||
| 7247 | @@ -7849,18 +7851,22 @@ void Sema::CheckVariableDeclarationType(VarDecl *NewVD) { | ||
| 7248 | // OpenCL C v2.0 s6.5.1 - Variables defined at program scope and static | ||
| 7249 | // variables inside a function can also be declared in the global | ||
| 7250 | // address space. | ||
| 7251 | + // OpenCL C v3.0 s5.5 - For OpenCL C 2.0, or with the | ||
| 7252 | + // __opencl_c_program_scope_global_variables feature macro, the | ||
| 7253 | + // address space for a variable at program scope or a static variable | ||
| 7254 | + // also be __global | ||
| 7255 | // C++ for OpenCL inherits rule from OpenCL C v2.0. | ||
| 7256 | // FIXME: Adding local AS in C++ for OpenCL might make sense. | ||
| 7257 | if (NewVD->isFileVarDecl() || NewVD->isStaticLocal() || | ||
| 7258 | NewVD->hasExternalStorage()) { | ||
| 7259 | - if (!T->isSamplerT() && | ||
| 7260 | - !T->isDependentType() && | ||
| 7261 | + if (!T->isSamplerT() && !T->isDependentType() && | ||
| 7262 | !(T.getAddressSpace() == LangAS::opencl_constant || | ||
| 7263 | (T.getAddressSpace() == LangAS::opencl_global && | ||
| 7264 | - (getLangOpts().OpenCLVersion == 200 || | ||
| 7265 | - getLangOpts().OpenCLCPlusPlus)))) { | ||
| 7266 | + (OpenCLFeatures.isEnabled( | ||
| 7267 | + "__opencl_c_program_scope_global_variables"))))) { | ||
| 7268 | int Scope = NewVD->isStaticLocal() | NewVD->hasExternalStorage() << 1; | ||
| 7269 | - if (getLangOpts().OpenCLVersion == 200 || getLangOpts().OpenCLCPlusPlus) | ||
| 7270 | + if (OpenCLFeatures.isEnabled( | ||
| 7271 | + "__opencl_c_program_scope_global_variables")) | ||
| 7272 | Diag(NewVD->getLocation(), diag::err_opencl_global_invalid_addr_space) | ||
| 7273 | << Scope << "global or constant"; | ||
| 7274 | else | ||
| 7275 | diff --git a/clang/lib/Sema/SemaDeclAttr.cpp b/clang/lib/Sema/SemaDeclAttr.cpp | ||
| 7276 | index a9a2a19b4797..73b35eae176a 100644 | ||
| 7277 | --- a/clang/lib/Sema/SemaDeclAttr.cpp | ||
| 7278 | +++ b/clang/lib/Sema/SemaDeclAttr.cpp | ||
| 7279 | @@ -6488,7 +6488,7 @@ static void handleInternalLinkageAttr(Sema &S, Decl *D, const ParsedAttr &AL) { | ||
| 7280 | } | ||
| 7281 | |||
| 7282 | static void handleOpenCLNoSVMAttr(Sema &S, Decl *D, const ParsedAttr &AL) { | ||
| 7283 | - if (S.LangOpts.OpenCLVersion != 200) | ||
| 7284 | + if (S.LangOpts.OpenCLVersion < 200) | ||
| 7285 | S.Diag(AL.getLoc(), diag::err_attribute_requires_opencl_version) | ||
| 7286 | << AL << "2.0" << 0; | ||
| 7287 | else | ||
| 7288 | @@ -6572,6 +6572,13 @@ static void handleOpenCLAccessAttr(Sema &S, Decl *D, const ParsedAttr &AL) { | ||
| 7289 | << AL << PDecl->getType() << DeclTy->isImageType(); | ||
| 7290 | D->setInvalidDecl(true); | ||
| 7291 | return; | ||
| 7292 | + } else if ((!S.getLangOpts().OpenCLCPlusPlus && | ||
| 7293 | + S.getLangOpts().OpenCLVersion >= 200) && | ||
| 7294 | + !S.getOpenCLOptions().isEnabled( | ||
| 7295 | + "__opencl_c_read_write_images")) { | ||
| 7296 | + S.Diag(AL.getLoc(), diag::err_opencl_requires_extension) | ||
| 7297 | + << 0 << PDecl->getType() << "__opencl_c_read_write_images"; | ||
| 7298 | + return; | ||
| 7299 | } | ||
| 7300 | } | ||
| 7301 | } | ||
| 7302 | diff --git a/clang/lib/Sema/SemaDeclCXX.cpp b/clang/lib/Sema/SemaDeclCXX.cpp | ||
| 7303 | index 22bf35dbd0cb..b2081bb6b407 100644 | ||
| 7304 | --- a/clang/lib/Sema/SemaDeclCXX.cpp | ||
| 7305 | +++ b/clang/lib/Sema/SemaDeclCXX.cpp | ||
| 7306 | @@ -38,9 +38,9 @@ | ||
| 7307 | #include "clang/Sema/ScopeInfo.h" | ||
| 7308 | #include "clang/Sema/SemaInternal.h" | ||
| 7309 | #include "clang/Sema/Template.h" | ||
| 7310 | +#include "llvm/ADT/STLExtras.h" | ||
| 7311 | #include "llvm/ADT/ScopeExit.h" | ||
| 7312 | #include "llvm/ADT/SmallString.h" | ||
| 7313 | -#include "llvm/ADT/STLExtras.h" | ||
| 7314 | #include "llvm/ADT/StringExtras.h" | ||
| 7315 | #include <map> | ||
| 7316 | #include <set> | ||
| 7317 | @@ -15228,6 +15228,11 @@ CheckOperatorNewDeleteTypes(Sema &SemaRef, const FunctionDecl *FnDecl, | ||
| 7318 | if (auto *PtrTy = ResultType->getAs<PointerType>()) { | ||
| 7319 | ResultType = RemoveAddressSpaceFromPtr(SemaRef, PtrTy); | ||
| 7320 | } | ||
| 7321 | + if (CanQual<PointerType> ExpectedPtrTy = | ||
| 7322 | + ExpectedResultType->getAs<PointerType>()) { | ||
| 7323 | + ExpectedResultType = SemaRef.Context.getCanonicalType( | ||
| 7324 | + RemoveAddressSpaceFromPtr(SemaRef, ExpectedPtrTy->getTypePtr())); | ||
| 7325 | + } | ||
| 7326 | } | ||
| 7327 | |||
| 7328 | // Check that the result type is what we expect. | ||
| 7329 | @@ -15261,6 +15266,11 @@ CheckOperatorNewDeleteTypes(Sema &SemaRef, const FunctionDecl *FnDecl, | ||
| 7330 | FnDecl->getParamDecl(0)->getType()->getAs<PointerType>()) { | ||
| 7331 | FirstParamType = RemoveAddressSpaceFromPtr(SemaRef, PtrTy); | ||
| 7332 | } | ||
| 7333 | + if (CanQual<PointerType> ExpectedPtrTy = | ||
| 7334 | + ExpectedFirstParamType->getAs<PointerType>()) { | ||
| 7335 | + ExpectedFirstParamType = SemaRef.Context.getCanonicalType( | ||
| 7336 | + RemoveAddressSpaceFromPtr(SemaRef, ExpectedPtrTy->getTypePtr())); | ||
| 7337 | + } | ||
| 7338 | } | ||
| 7339 | |||
| 7340 | // Check that the first parameter type is what we expect. | ||
| 7341 | diff --git a/clang/lib/Sema/SemaLookup.cpp b/clang/lib/Sema/SemaLookup.cpp | ||
| 7342 | index bcbecd545398..40eaebbc9495 100644 | ||
| 7343 | --- a/clang/lib/Sema/SemaLookup.cpp | ||
| 7344 | +++ b/clang/lib/Sema/SemaLookup.cpp | ||
| 7345 | @@ -775,19 +775,20 @@ static void InsertOCLBuiltinDeclarationsFromTable(Sema &S, LookupResult &LR, | ||
| 7346 | // as argument. Only meaningful for generic types, otherwise equals 1. | ||
| 7347 | unsigned GenTypeMaxCnt; | ||
| 7348 | |||
| 7349 | + ASTContext &Context = S.Context; | ||
| 7350 | + | ||
| 7351 | + // Ignore this BIF if its version does not match the language options. | ||
| 7352 | + unsigned OpenCLVersion = Context.getLangOpts().OpenCLVersion; | ||
| 7353 | + if (Context.getLangOpts().OpenCLCPlusPlus) | ||
| 7354 | + OpenCLVersion = 200; | ||
| 7355 | + | ||
| 7356 | + unsigned short VersionCode = OpenCLOptions::EncodeVersion(OpenCLVersion); | ||
| 7357 | + | ||
| 7358 | for (unsigned SignatureIndex = 0; SignatureIndex < Len; SignatureIndex++) { | ||
| 7359 | const OpenCLBuiltinStruct &OpenCLBuiltin = | ||
| 7360 | BuiltinTable[FctIndex + SignatureIndex]; | ||
| 7361 | - ASTContext &Context = S.Context; | ||
| 7362 | |||
| 7363 | - // Ignore this BIF if its version does not match the language options. | ||
| 7364 | - unsigned OpenCLVersion = Context.getLangOpts().OpenCLVersion; | ||
| 7365 | - if (Context.getLangOpts().OpenCLCPlusPlus) | ||
| 7366 | - OpenCLVersion = 200; | ||
| 7367 | - if (OpenCLVersion < OpenCLBuiltin.MinVersion) | ||
| 7368 | - continue; | ||
| 7369 | - if ((OpenCLBuiltin.MaxVersion != 0) && | ||
| 7370 | - (OpenCLVersion >= OpenCLBuiltin.MaxVersion)) | ||
| 7371 | + if (!(OpenCLBuiltin.AllVersions & VersionCode)) | ||
| 7372 | continue; | ||
| 7373 | |||
| 7374 | SmallVector<QualType, 1> RetTypes; | ||
| 7375 | diff --git a/clang/lib/Sema/SemaType.cpp b/clang/lib/Sema/SemaType.cpp | ||
| 7376 | index cc151a048b98..f380a5656a57 100644 | ||
| 7377 | --- a/clang/lib/Sema/SemaType.cpp | ||
| 7378 | +++ b/clang/lib/Sema/SemaType.cpp | ||
| 7379 | @@ -2042,7 +2042,7 @@ static QualType deduceOpenCLPointeeAddrSpace(Sema &S, QualType PointeeType) { | ||
| 7380 | !PointeeType.hasAddressSpace()) | ||
| 7381 | PointeeType = S.getASTContext().getAddrSpaceQualType( | ||
| 7382 | PointeeType, | ||
| 7383 | - S.getLangOpts().OpenCLCPlusPlus || S.getLangOpts().OpenCLVersion == 200 | ||
| 7384 | + S.getOpenCLOptions().isEnabled("__opencl_c_generic_address_space") | ||
| 7385 | ? LangAS::opencl_generic | ||
| 7386 | : LangAS::opencl_private); | ||
| 7387 | return PointeeType; | ||
| 7388 | @@ -5316,9 +5316,15 @@ static TypeSourceInfo *GetFullTypeForDeclarator(TypeProcessingState &state, | ||
| 7389 | } | ||
| 7390 | |||
| 7391 | case DeclaratorChunk::Pipe: { | ||
| 7392 | - T = S.BuildReadPipeType(T, DeclType.Loc); | ||
| 7393 | - processTypeAttrs(state, T, TAL_DeclSpec, | ||
| 7394 | - D.getMutableDeclSpec().getAttributes()); | ||
| 7395 | + if (S.getOpenCLOptions().isEnabled("__opencl_c_pipes")) { | ||
| 7396 | + T = S.BuildReadPipeType(T, DeclType.Loc); | ||
| 7397 | + processTypeAttrs(state, T, TAL_DeclSpec, | ||
| 7398 | + D.getMutableDeclSpec().getAttributes()); | ||
| 7399 | + } else { | ||
| 7400 | + D.setInvalidType(true); | ||
| 7401 | + T = Context.IntTy; | ||
| 7402 | + S.Diag(D.getIdentifierLoc(), diag::err_opencl_pipes_require_feat); | ||
| 7403 | + } | ||
| 7404 | break; | ||
| 7405 | } | ||
| 7406 | } | ||
| 7407 | diff --git a/clang/test/CodeGenOpenCL/addr-space-struct-arg.cl b/clang/test/CodeGenOpenCL/addr-space-struct-arg.cl | ||
| 7408 | index e1f3f6fe1419..b43d9df5935c 100644 | ||
| 7409 | --- a/clang/test/CodeGenOpenCL/addr-space-struct-arg.cl | ||
| 7410 | +++ b/clang/test/CodeGenOpenCL/addr-space-struct-arg.cl | ||
| 7411 | @@ -2,7 +2,8 @@ | ||
| 7412 | // RUN: %clang_cc1 %s -emit-llvm -o - -O0 -triple amdgcn | FileCheck -enable-var-scope -check-prefixes=ALL,AMDGCN %s | ||
| 7413 | // RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL2.0 -O0 -triple amdgcn | FileCheck -enable-var-scope -check-prefixes=ALL,AMDGCN,AMDGCN20 %s | ||
| 7414 | // RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL1.2 -O0 -triple spir-unknown-unknown-unknown | FileCheck -enable-var-scope -check-prefixes=SPIR %s | ||
| 7415 | - | ||
| 7416 | +// RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL3.0 -O0 -triple spir-unknown-unknown-unknown | FileCheck -enable-var-scope -check-prefixes=SPIR %s | ||
| 7417 | +// RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL3.0 -cl-ext=__opencl_c_program_scope_global_variables -O0 -triple spir-unknown-unknown-unknown | FileCheck -enable-var-scope -check-prefixes=SPIR %s | ||
| 7418 | typedef int int2 __attribute__((ext_vector_type(2))); | ||
| 7419 | |||
| 7420 | typedef struct { | ||
| 7421 | @@ -39,7 +40,7 @@ struct LargeStructTwoMember { | ||
| 7422 | int2 y[20]; | ||
| 7423 | }; | ||
| 7424 | |||
| 7425 | -#if __OPENCL_C_VERSION__ >= 200 | ||
| 7426 | +#ifdef __opencl_c_program_scope_global_variables | ||
| 7427 | struct LargeStructOneMember g_s; | ||
| 7428 | #endif | ||
| 7429 | |||
| 7430 | @@ -98,7 +99,7 @@ void FuncOneLargeMember(struct LargeStructOneMember u) { | ||
| 7431 | // AMDGCN20: %[[r0:.*]] = bitcast %struct.LargeStructOneMember addrspace(5)* %[[byval_temp]] to i8 addrspace(5)* | ||
| 7432 | // AMDGCN20: call void @llvm.memcpy.p5i8.p1i8.i64(i8 addrspace(5)* align 8 %[[r0]], i8 addrspace(1)* align 8 bitcast (%struct.LargeStructOneMember addrspace(1)* @g_s to i8 addrspace(1)*), i64 800, i1 false) | ||
| 7433 | // AMDGCN20: call void @FuncOneLargeMember(%struct.LargeStructOneMember addrspace(5)* byval(%struct.LargeStructOneMember) align 8 %[[byval_temp]]) | ||
| 7434 | -#if __OPENCL_C_VERSION__ >= 200 | ||
| 7435 | +#ifdef __opencl_c_program_scope_global_variables | ||
| 7436 | void test_indirect_arg_globl(void) { | ||
| 7437 | FuncOneLargeMember(g_s); | ||
| 7438 | } | ||
| 7439 | diff --git a/clang/test/CodeGenOpenCL/address-spaces-conversions.cl b/clang/test/CodeGenOpenCL/address-spaces-conversions.cl | ||
| 7440 | index 52feccc540bb..9ecffcca5ee9 100644 | ||
| 7441 | --- a/clang/test/CodeGenOpenCL/address-spaces-conversions.cl | ||
| 7442 | +++ b/clang/test/CodeGenOpenCL/address-spaces-conversions.cl | ||
| 7443 | @@ -1,5 +1,7 @@ | ||
| 7444 | // RUN: %clang_cc1 %s -triple x86_64-unknown-linux-gnu -O0 -ffake-address-space-map -cl-std=CL2.0 -emit-llvm -o - | FileCheck %s | ||
| 7445 | +// RUN: %clang_cc1 %s -triple x86_64-unknown-linux-gnu -O0 -ffake-address-space-map -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space -emit-llvm -o - | FileCheck %s | ||
| 7446 | // RUN: %clang_cc1 %s -triple x86_64-unknown-linux-gnu -O0 -cl-std=CL2.0 -emit-llvm -o - | FileCheck --check-prefix=CHECK-NOFAKE %s | ||
| 7447 | +// RUN: %clang_cc1 %s -triple x86_64-unknown-linux-gnu -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space -emit-llvm -o - | FileCheck --check-prefix=CHECK-NOFAKE %s | ||
| 7448 | // When -ffake-address-space-map is not used, all addr space mapped to 0 for x86_64. | ||
| 7449 | |||
| 7450 | // test that we generate address space casts everywhere we need conversions of | ||
| 7451 | diff --git a/clang/test/CodeGenOpenCL/address-spaces-mangling.cl b/clang/test/CodeGenOpenCL/address-spaces-mangling.cl | ||
| 7452 | index 50622f099143..e19ec8451d0d 100644 | ||
| 7453 | --- a/clang/test/CodeGenOpenCL/address-spaces-mangling.cl | ||
| 7454 | +++ b/clang/test/CodeGenOpenCL/address-spaces-mangling.cl | ||
| 7455 | @@ -6,6 +6,7 @@ | ||
| 7456 | // We check that the address spaces are mangled the same in both version of OpenCL | ||
| 7457 | // RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL2.0 -emit-llvm -o - | FileCheck -check-prefix=OCL-20 %s | ||
| 7458 | // RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL1.2 -emit-llvm -o - | FileCheck -check-prefix=OCL-12 %s | ||
| 7459 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL3.0 -emit-llvm -o - | FileCheck -check-prefix=OCL-12 %s | ||
| 7460 | |||
| 7461 | // We can't name this f as private is equivalent to default | ||
| 7462 | // no specifier given address space so we get multiple definition | ||
| 7463 | @@ -47,7 +48,7 @@ void f(constant int *arg) { } | ||
| 7464 | // OCL-20-DAG: @_Z1fPU3AS2i | ||
| 7465 | // OCL-12-DAG: @_Z1fPU3AS2i | ||
| 7466 | |||
| 7467 | -#if __OPENCL_C_VERSION__ >= 200 | ||
| 7468 | +#if __OPENCL_C_VERSION__ == 200 | ||
| 7469 | __attribute__((overloadable)) | ||
| 7470 | void f(generic int *arg) { } | ||
| 7471 | // ASMANG20: @_Z1fPU3AS4i | ||
| 7472 | diff --git a/clang/test/CodeGenOpenCL/address-spaces.cl b/clang/test/CodeGenOpenCL/address-spaces.cl | ||
| 7473 | index 144466a690b3..b150e1080b53 100644 | ||
| 7474 | --- a/clang/test/CodeGenOpenCL/address-spaces.cl | ||
| 7475 | +++ b/clang/test/CodeGenOpenCL/address-spaces.cl | ||
| 7476 | @@ -1,9 +1,13 @@ | ||
| 7477 | // RUN: %clang_cc1 %s -O0 -ffake-address-space-map -emit-llvm -o - | FileCheck %s --check-prefixes=CHECK,SPIR | ||
| 7478 | +// RUN: %clang_cc1 %s -O0 -cl-std=CL3.0 -ffake-address-space-map -emit-llvm -o - | FileCheck %s --check-prefixes=CHECK,SPIR | ||
| 7479 | // RUN: %clang_cc1 %s -O0 -DCL20 -cl-std=CL2.0 -ffake-address-space-map -emit-llvm -o - | FileCheck %s --check-prefixes=CL20,CL20SPIR | ||
| 7480 | // RUN: %clang_cc1 %s -O0 -triple amdgcn-amd-amdhsa -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7481 | +// RUN: %clang_cc1 %s -O0 -cl-std=CL3.0 -triple amdgcn-amd-amdhsa -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7482 | // RUN: %clang_cc1 %s -O0 -triple amdgcn-amd-amdhsa -DCL20 -cl-std=CL2.0 -emit-llvm -o - | FileCheck %s --check-prefixes=CL20,CL20AMDGCN | ||
| 7483 | // RUN: %clang_cc1 %s -O0 -triple amdgcn-mesa-mesa3d -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7484 | +// RUN: %clang_cc1 %s -O0 -cl-std=CL3.0 -triple amdgcn-mesa-mesa3d -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7485 | // RUN: %clang_cc1 %s -O0 -triple r600-- -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7486 | +// RUN: %clang_cc1 %s -O0 -cl-std=CL3.0 -triple r600-- -emit-llvm -o - | FileCheck --check-prefixes=CHECK,AMDGCN %s | ||
| 7487 | |||
| 7488 | // SPIR: %struct.S = type { i32, i32, i32* } | ||
| 7489 | // CL20SPIR: %struct.S = type { i32, i32, i32 addrspace(4)* } | ||
| 7490 | diff --git a/clang/test/CodeGenOpenCL/amdgcn-automatic-variable.cl b/clang/test/CodeGenOpenCL/amdgcn-automatic-variable.cl | ||
| 7491 | index 7216cb517495..8d3b30fe8074 100644 | ||
| 7492 | --- a/clang/test/CodeGenOpenCL/amdgcn-automatic-variable.cl | ||
| 7493 | +++ b/clang/test/CodeGenOpenCL/amdgcn-automatic-variable.cl | ||
| 7494 | @@ -1,4 +1,5 @@ | ||
| 7495 | // RUN: %clang_cc1 -O0 -cl-std=CL1.2 -triple amdgcn---amdgizcl -emit-llvm %s -o - | FileCheck -check-prefixes=CHECK,CL12 %s | ||
| 7496 | +// RUN: %clang_cc1 -O0 -cl-std=CL3.0 -triple amdgcn---amdgizcl -emit-llvm %s -o - | FileCheck -check-prefixes=CHECK,CL12 %s | ||
| 7497 | // RUN: %clang_cc1 -O0 -cl-std=CL2.0 -triple amdgcn---amdgizcl -emit-llvm %s -o - | FileCheck -check-prefixes=CHECK,CL20 %s | ||
| 7498 | |||
| 7499 | // CL12-LABEL: define void @func1(i32 addrspace(5)* %x) | ||
| 7500 | diff --git a/clang/test/CodeGenOpenCL/amdgpu-sizeof-alignof.cl b/clang/test/CodeGenOpenCL/amdgpu-sizeof-alignof.cl | ||
| 7501 | index a5d438933fa4..8073c7756eb6 100644 | ||
| 7502 | --- a/clang/test/CodeGenOpenCL/amdgpu-sizeof-alignof.cl | ||
| 7503 | +++ b/clang/test/CodeGenOpenCL/amdgpu-sizeof-alignof.cl | ||
| 7504 | @@ -4,6 +4,17 @@ | ||
| 7505 | // RUN: %clang_cc1 -triple amdgcn---opencl -cl-std=CL2.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7506 | // RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-std=CL1.2 %s -emit-llvm -o - | FileCheck %s | ||
| 7507 | // RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-std=CL2.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7508 | +// RUN: %clang_cc1 -triple r600 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7509 | +// RUN: %clang_cc1 -triple amdgcn-mesa-mesa3d -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7510 | +// RUN: %clang_cc1 -triple amdgcn---opencl -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7511 | +// RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7512 | +// RUN: %clang_cc1 -triple amdgcn-mesa-mesa3d -cl-ext=__opencl_c_generic_address_space -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7513 | +// RUN: %clang_cc1 -triple amdgcn---opencl -cl-ext=__opencl_c_generic_address_space -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7514 | +// RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-ext=__opencl_c_generic_address_space -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7515 | +// RUN: %clang_cc1 -triple r600 -cl-ext=__opencl_c_fp64 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7516 | +// RUN: %clang_cc1 -triple amdgcn-mesa-mesa3d -cl-ext=__opencl_c_fp64 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7517 | +// RUN: %clang_cc1 -triple amdgcn---opencl -cl-ext=__opencl_c_fp64 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7518 | +// RUN: %clang_cc1 -triple amdgcn---amdgizcl -cl-ext=__opencl_c_fp64 -cl-std=CL3.0 %s -emit-llvm -o - | FileCheck %s | ||
| 7519 | |||
| 7520 | #ifdef __AMDGCN__ | ||
| 7521 | #define PTSIZE 8 | ||
| 7522 | @@ -11,7 +22,7 @@ | ||
| 7523 | #define PTSIZE 4 | ||
| 7524 | #endif | ||
| 7525 | |||
| 7526 | -#ifdef cl_khr_fp64 | ||
| 7527 | +#if defined(cl_khr_fp64) || defined(__opencl_c_fp64) | ||
| 7528 | #pragma OPENCL EXTENSION cl_khr_fp64 : enable | ||
| 7529 | #endif | ||
| 7530 | #ifdef cl_khr_fp16 | ||
| 7531 | @@ -59,8 +70,12 @@ void test() { | ||
| 7532 | check(__alignof__(double) == 8); | ||
| 7533 | #endif | ||
| 7534 | |||
| 7535 | - check(sizeof(void*) == (__OPENCL_C_VERSION__ >= 200 ? 8 : 4)); | ||
| 7536 | - check(__alignof__(void*) == (__OPENCL_C_VERSION__ >= 200 ? 8 : 4)); | ||
| 7537 | + check(sizeof(private void*) == 4); | ||
| 7538 | + check(__alignof__(private void*) == 4); | ||
| 7539 | +#ifdef __opencl_c_generic_address_space | ||
| 7540 | + check(sizeof(generic void*) == 8); | ||
| 7541 | + check(__alignof__(generic void*) == 8); | ||
| 7542 | +#endif | ||
| 7543 | check(sizeof(global_ptr_t) == PTSIZE); | ||
| 7544 | check(__alignof__(global_ptr_t) == PTSIZE); | ||
| 7545 | check(sizeof(constant_ptr_t) == PTSIZE); | ||
| 7546 | diff --git a/clang/test/CodeGenOpenCL/arm-integer-dot-product.cl b/clang/test/CodeGenOpenCL/arm-integer-dot-product.cl | ||
| 7547 | index d1ab6aceac5c..70c5bace023b 100644 | ||
| 7548 | --- a/clang/test/CodeGenOpenCL/arm-integer-dot-product.cl | ||
| 7549 | +++ b/clang/test/CodeGenOpenCL/arm-integer-dot-product.cl | ||
| 7550 | @@ -1,4 +1,5 @@ | ||
| 7551 | // RUN: %clang_cc1 %s -triple spir-unknown-unknown -finclude-default-header -cl-std=CL1.2 -emit-llvm -o - -O0 | FileCheck %s | ||
| 7552 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -finclude-default-header -cl-std=CL3.0 -emit-llvm -o - -O0 | FileCheck %s | ||
| 7553 | |||
| 7554 | #pragma OPENCL EXTENSION cl_arm_integer_dot_product_int8 : enable | ||
| 7555 | void test_int8(uchar4 ua, uchar4 ub, char4 sa, char4 sb) { | ||
| 7556 | diff --git a/clang/test/CodeGenOpenCL/cl-uniform-wg-size.cl b/clang/test/CodeGenOpenCL/cl-uniform-wg-size.cl | ||
| 7557 | index 76ace5dca21e..5dc43e222f75 100644 | ||
| 7558 | --- a/clang/test/CodeGenOpenCL/cl-uniform-wg-size.cl | ||
| 7559 | +++ b/clang/test/CodeGenOpenCL/cl-uniform-wg-size.cl | ||
| 7560 | @@ -1,6 +1,8 @@ | ||
| 7561 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL1.2 -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-UNIFORM | ||
| 7562 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL2.0 -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-NONUNIFORM | ||
| 7563 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL2.0 -cl-uniform-work-group-size -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-UNIFORM | ||
| 7564 | +// RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL3.0 -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-NONUNIFORM | ||
| 7565 | +// RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL3.0 -cl-uniform-work-group-size -o - %s 2>&1 | FileCheck %s -check-prefixes CHECK,CHECK-UNIFORM | ||
| 7566 | |||
| 7567 | kernel void ker() {}; | ||
| 7568 | // CHECK: define{{.*}}@ker() #0 | ||
| 7569 | diff --git a/clang/test/CodeGenOpenCL/fpmath.cl b/clang/test/CodeGenOpenCL/fpmath.cl | ||
| 7570 | index 0108d909c94e..b28392739c71 100644 | ||
| 7571 | --- a/clang/test/CodeGenOpenCL/fpmath.cl | ||
| 7572 | +++ b/clang/test/CodeGenOpenCL/fpmath.cl | ||
| 7573 | @@ -2,6 +2,8 @@ | ||
| 7574 | // RUN: %clang_cc1 %s -emit-llvm -o - -triple spir-unknown-unknown -cl-fp32-correctly-rounded-divide-sqrt | FileCheck --check-prefix=CHECK --check-prefix=DIVOPT %s | ||
| 7575 | // RUN: %clang_cc1 %s -emit-llvm -o - -DNOFP64 -cl-std=CL1.2 -triple r600-unknown-unknown -target-cpu r600 -pedantic | FileCheck --check-prefix=CHECK-FLT %s | ||
| 7576 | // RUN: %clang_cc1 %s -emit-llvm -o - -DFP64 -cl-std=CL1.2 -triple spir-unknown-unknown -pedantic | FileCheck --check-prefix=CHECK-DBL %s | ||
| 7577 | +// RUN: %clang_cc1 %s -emit-llvm -o - -DNOFP64 -cl-std=CL3.0 -triple r600-unknown-unknown -target-cpu r600 -pedantic | FileCheck --check-prefix=CHECK-FLT %s | ||
| 7578 | +// RUN: %clang_cc1 %s -emit-llvm -o - -DFP64 -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 -triple spir-unknown-unknown -pedantic | FileCheck --check-prefix=CHECK-DBL %s | ||
| 7579 | |||
| 7580 | typedef __attribute__(( ext_vector_type(4) )) float float4; | ||
| 7581 | |||
| 7582 | diff --git a/clang/test/CodeGenOpenCL/generic-address-space-feature.cl b/clang/test/CodeGenOpenCL/generic-address-space-feature.cl | ||
| 7583 | new file mode 100644 | ||
| 7584 | index 000000000000..890860abe4d9 | ||
| 7585 | --- /dev/null | ||
| 7586 | +++ b/clang/test/CodeGenOpenCL/generic-address-space-feature.cl | ||
| 7587 | @@ -0,0 +1,28 @@ | ||
| 7588 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL1.2 -cl-ext=-cl_khr_fp64 -finclude-default-header -emit-llvm -o - | FileCheck %s --check-prefixes=CL12 | ||
| 7589 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL1.2 -cl-ext=-cl_khr_fp64 -fdeclare-opencl-builtins -emit-llvm -o - | FileCheck %s --check-prefixes=CL12 | ||
| 7590 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL2.0 -cl-ext=-cl_khr_fp64 -finclude-default-header -emit-llvm -o - | FileCheck %s --check-prefixes=CL20 | ||
| 7591 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL2.0 -cl-ext=-cl_khr_fp64 -fdeclare-opencl-builtins -emit-llvm -o - | FileCheck %s --check-prefixes=CL20 | ||
| 7592 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL3.0 -cl-ext=-cl_khr_fp64 -finclude-default-header -emit-llvm -o - | FileCheck %s --check-prefixes=CL30 | ||
| 7593 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL3.0 -cl-ext=-cl_khr_fp64,__opencl_c_generic_address_space -finclude-default-header -emit-llvm -o - | FileCheck %s --check-prefixes=CL30-GENERIC | ||
| 7594 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL3.0 -cl-ext=-cl_khr_fp64 -fdeclare-opencl-builtins -emit-llvm -o - | FileCheck %s --check-prefixes=CL30 | ||
| 7595 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -O0 -cl-std=CL3.0 -cl-ext=-cl_khr_fp64,__opencl_c_generic_address_space -fdeclare-opencl-builtins -emit-llvm -o - | FileCheck %s --check-prefixes=CL30-GENERIC | ||
| 7596 | + | ||
| 7597 | +void test(global float* src1, local float *src2, private float *src3, float *src4, float tmp) { | ||
| 7598 | + // CL20: %{{.+}} = addrspacecast float addrspace(1)* %{{.+}} to float addrspace(4)* | ||
| 7599 | + // CL12-NOT: addrspacecast | ||
| 7600 | + // CL30-NOT: addrspacecast | ||
| 7601 | + // CL30-GENERIC-NOT: addrspacecast | ||
| 7602 | + tmp = sincos(tmp, src1); | ||
| 7603 | + // CL20: %{{.+}} = addrspacecast float addrspace(3)* %{{.+}} to float addrspace(4)* | ||
| 7604 | + // CL12-NOT: addrspacecast | ||
| 7605 | + // CL30-NOT: addrspacecast | ||
| 7606 | + // CL30-GENERIC-NOT: addrspacecast | ||
| 7607 | + tmp = sincos(tmp, src2); | ||
| 7608 | + | ||
| 7609 | + // CL12: %{{.+}} = call {{(spir_func )?}}float [[FUNCNAME:@.*sincos.*]](float %{{.+}}, float* {{.+}}) | ||
| 7610 | + // CL20: %{{.+}} = call {{(spir_func )?}}float [[FUNCNAME:@.*sincos.*]](float %{{.+}}, float addrspace(4)* {{.+}}) | ||
| 7611 | + // CL30: %{{.+}} = call {{(spir_func )?}}float [[FUNCNAME:@.*sincos.*]](float %{{.+}}, float* {{.+}}) | ||
| 7612 | + // CL30-GENERIC: %{{.+}} = call {{(spir_func )?}}float [[FUNCNAME:@.*sincos.*]](float %{{.+}}, float addrspace(4)* {{.+}}) | ||
| 7613 | + // CHECK: addrspacecast | ||
| 7614 | + tmp = sincos(tmp, src4); | ||
| 7615 | +} | ||
| 7616 | diff --git a/clang/test/CodeGenOpenCL/intel-subgroups-avc-ext-types.cl b/clang/test/CodeGenOpenCL/intel-subgroups-avc-ext-types.cl | ||
| 7617 | index 515f13f6e768..5aa31ac6f345 100644 | ||
| 7618 | --- a/clang/test/CodeGenOpenCL/intel-subgroups-avc-ext-types.cl | ||
| 7619 | +++ b/clang/test/CodeGenOpenCL/intel-subgroups-avc-ext-types.cl | ||
| 7620 | @@ -1,4 +1,5 @@ | ||
| 7621 | // RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL1.2 -cl-ext=+cl_intel_device_side_avc_motion_estimation -emit-llvm -o - -O0 | FileCheck %s | ||
| 7622 | +// RUN: %clang_cc1 %s -triple spir-unknown-unknown -cl-std=CL3.0 -cl-ext=+cl_intel_device_side_avc_motion_estimation -emit-llvm -o - -O0 | FileCheck %s | ||
| 7623 | |||
| 7624 | // CHECK: %opencl.intel_sub_group_avc_mce_payload_t = type opaque | ||
| 7625 | // CHECK: %opencl.intel_sub_group_avc_ime_payload_t = type opaque | ||
| 7626 | diff --git a/clang/test/CodeGenOpenCL/kernels-have-spir-cc-by-default.cl b/clang/test/CodeGenOpenCL/kernels-have-spir-cc-by-default.cl | ||
| 7627 | index e89237623478..3d6708ac361f 100644 | ||
| 7628 | --- a/clang/test/CodeGenOpenCL/kernels-have-spir-cc-by-default.cl | ||
| 7629 | +++ b/clang/test/CodeGenOpenCL/kernels-have-spir-cc-by-default.cl | ||
| 7630 | @@ -1,5 +1,8 @@ | ||
| 7631 | // RUN: %clang_cc1 %s -cl-std=CL1.2 -emit-llvm -triple x86_64-unknown-unknown -o - | FileCheck %s | ||
| 7632 | // RUN: %clang_cc1 %s -cl-std=CL1.2 -emit-llvm -triple amdgcn-unknown-unknown -o - | FileCheck -check-prefixes=AMDGCN %s | ||
| 7633 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 -emit-llvm -triple x86_64-unknown-unknown -o - | FileCheck %s | ||
| 7634 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 -emit-llvm -triple amdgcn-unknown-unknown -o - | FileCheck -check-prefixes=AMDGCN %s | ||
| 7635 | + | ||
| 7636 | // Test that the kernels always use the SPIR calling convention | ||
| 7637 | // to have unambiguous mapping of arguments to feasibly implement | ||
| 7638 | // clSetKernelArg(). | ||
| 7639 | diff --git a/clang/test/CodeGenOpenCL/logical-ops.cl b/clang/test/CodeGenOpenCL/logical-ops.cl | ||
| 7640 | index f083a8580ee7..499eab65039b 100644 | ||
| 7641 | --- a/clang/test/CodeGenOpenCL/logical-ops.cl | ||
| 7642 | +++ b/clang/test/CodeGenOpenCL/logical-ops.cl | ||
| 7643 | @@ -1,4 +1,5 @@ | ||
| 7644 | // RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL1.2 -O1 -triple x86_64-unknown-linux-gnu | FileCheck %s | ||
| 7645 | +// RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 -O1 -triple x86_64-unknown-linux-gnu | FileCheck %s | ||
| 7646 | // RUN: %clang_cc1 %s -emit-llvm -o - -cl-std=clc++ -O1 -triple x86_64-unknown-linux-gnu | FileCheck %s | ||
| 7647 | |||
| 7648 | #pragma OPENCL EXTENSION cl_khr_fp64 : enable | ||
| 7649 | diff --git a/clang/test/CodeGenOpenCL/no-half.cl b/clang/test/CodeGenOpenCL/no-half.cl | ||
| 7650 | index aee8f678f01a..46da7fa339e8 100644 | ||
| 7651 | --- a/clang/test/CodeGenOpenCL/no-half.cl | ||
| 7652 | +++ b/clang/test/CodeGenOpenCL/no-half.cl | ||
| 7653 | @@ -1,6 +1,7 @@ | ||
| 7654 | // RUN: %clang_cc1 %s -cl-std=cl2.0 -emit-llvm -o - -triple spir-unknown-unknown | FileCheck %s | ||
| 7655 | // RUN: %clang_cc1 %s -cl-std=cl1.2 -emit-llvm -o - -triple spir-unknown-unknown | FileCheck %s | ||
| 7656 | // RUN: %clang_cc1 %s -cl-std=cl1.1 -emit-llvm -o - -triple spir-unknown-unknown | FileCheck %s | ||
| 7657 | +// RUN: %clang_cc1 %s -cl-std=cl3.0 -cl-ext=__opencl_c_fp64 -emit-llvm -o - -triple spir-unknown-unknown | FileCheck %s | ||
| 7658 | |||
| 7659 | #pragma OPENCL EXTENSION cl_khr_fp64:enable | ||
| 7660 | |||
| 7661 | diff --git a/clang/test/CodeGenOpenCL/pipe_builtin.cl b/clang/test/CodeGenOpenCL/pipe_builtin.cl | ||
| 7662 | index 02b9669b7ab1..0bf35c336199 100644 | ||
| 7663 | --- a/clang/test/CodeGenOpenCL/pipe_builtin.cl | ||
| 7664 | +++ b/clang/test/CodeGenOpenCL/pipe_builtin.cl | ||
| 7665 | @@ -1,4 +1,7 @@ | ||
| 7666 | // RUN: %clang_cc1 -triple %itanium_abi_triple -emit-llvm -cl-ext=+cl_khr_subgroups -O0 -cl-std=clc++ -o - %s | FileCheck %s | ||
| 7667 | +// RUN: %clang_cc1 -triple %itanium_abi_triple -emit-llvm -cl-ext=+cl_khr_subgroups -O0 -cl-std=cl2.0 -o - %s | FileCheck %s | ||
| 7668 | +// RUN: %clang_cc1 -triple %itanium_abi_triple -emit-llvm -cl-ext=+cl_khr_subgroups -O0 -cl-std=cl3.0 -cl-ext=__opencl_c_pipes,__opencl_c_subgroups -o - %s | FileCheck %s | ||
| 7669 | + | ||
| 7670 | // FIXME: Add MS ABI manglings of OpenCL things and remove %itanium_abi_triple | ||
| 7671 | // above to support OpenCL in the MS C++ ABI. | ||
| 7672 | |||
| 7673 | diff --git a/clang/test/CodeGenOpenCL/pipe_types.cl b/clang/test/CodeGenOpenCL/pipe_types.cl | ||
| 7674 | index ba064c6d7557..b7a523d4f084 100644 | ||
| 7675 | --- a/clang/test/CodeGenOpenCL/pipe_types.cl | ||
| 7676 | +++ b/clang/test/CodeGenOpenCL/pipe_types.cl | ||
| 7677 | @@ -1,4 +1,5 @@ | ||
| 7678 | // RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -emit-llvm -O0 -cl-std=CL2.0 -o - %s | FileCheck %s | ||
| 7679 | +// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -emit-llvm -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -o - %s | FileCheck %s | ||
| 7680 | |||
| 7681 | // CHECK: %opencl.pipe_ro_t = type opaque | ||
| 7682 | // CHECK: %opencl.pipe_wo_t = type opaque | ||
| 7683 | diff --git a/clang/test/CodeGenOpenCL/printf.cl b/clang/test/CodeGenOpenCL/printf.cl | ||
| 7684 | index fc139d776db6..0133c5595d81 100644 | ||
| 7685 | --- a/clang/test/CodeGenOpenCL/printf.cl | ||
| 7686 | +++ b/clang/test/CodeGenOpenCL/printf.cl | ||
| 7687 | @@ -1,5 +1,7 @@ | ||
| 7688 | // RUN: %clang_cc1 -cl-std=CL1.2 -cl-ext=-+cl_khr_fp64 -triple spir-unknown-unknown -disable-llvm-passes -emit-llvm -o - %s | FileCheck -check-prefixes=FP64,ALL %s | ||
| 7689 | // RUN: %clang_cc1 -cl-std=CL1.2 -cl-ext=-cl_khr_fp64 -triple spir-unknown-unknown -disable-llvm-passes -emit-llvm -o - %s | FileCheck -check-prefixes=NOFP64,ALL %s | ||
| 7690 | +// RUN: %clang_cc1 -cl-std=CL3.0 -cl-ext=+__opencl_c_fp64 -triple spir-unknown-unknown -disable-llvm-passes -emit-llvm -o - %s | FileCheck -check-prefixes=FP64,ALL %s | ||
| 7691 | +// RUN: %clang_cc1 -cl-std=CL3.0 -triple spir-unknown-unknown -disable-llvm-passes -emit-llvm -o - %s | FileCheck -check-prefixes=NOFP64,ALL %s | ||
| 7692 | |||
| 7693 | typedef __attribute__((ext_vector_type(2))) float float2; | ||
| 7694 | typedef __attribute__((ext_vector_type(2))) half half2; | ||
| 7695 | diff --git a/clang/test/CodeGenOpenCL/unroll-hint.cl b/clang/test/CodeGenOpenCL/unroll-hint.cl | ||
| 7696 | index 0f84450a1ae6..9347c935869b 100644 | ||
| 7697 | --- a/clang/test/CodeGenOpenCL/unroll-hint.cl | ||
| 7698 | +++ b/clang/test/CodeGenOpenCL/unroll-hint.cl | ||
| 7699 | @@ -1,5 +1,6 @@ | ||
| 7700 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL2.0 -o - %s | FileCheck %s | ||
| 7701 | // RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL1.2 -o - %s | FileCheck %s | ||
| 7702 | +// RUN: %clang_cc1 -emit-llvm -O0 -cl-std=CL3.0 -o - %s | FileCheck %s | ||
| 7703 | |||
| 7704 | /*** for ***/ | ||
| 7705 | void for_count() | ||
| 7706 | diff --git a/clang/test/Driver/autocomplete.c b/clang/test/Driver/autocomplete.c | ||
| 7707 | index 18b31320ea80..a6e7be887c8c 100644 | ||
| 7708 | --- a/clang/test/Driver/autocomplete.c | ||
| 7709 | +++ b/clang/test/Driver/autocomplete.c | ||
| 7710 | @@ -43,6 +43,8 @@ | ||
| 7711 | // CLSTDALL-NEXT: CL1.2 | ||
| 7712 | // CLSTDALL-NEXT: cl2.0 | ||
| 7713 | // CLSTDALL-NEXT: CL2.0 | ||
| 7714 | +// CLSTDALL-NEXT: cl3.0 | ||
| 7715 | +// CLSTDALL-NEXT: CL3.0 | ||
| 7716 | // CLSTDALL-NEXT: clc++ | ||
| 7717 | // CLSTDALL-NEXT: CLC++ | ||
| 7718 | // RUN: %clang --autocomplete=-fno-sanitize-coverage=,f | FileCheck %s -check-prefix=FNOSANICOVER | ||
| 7719 | diff --git a/clang/test/Driver/opencl.cl b/clang/test/Driver/opencl.cl | ||
| 7720 | index 05588f2c8b81..cc0a9143ab37 100644 | ||
| 7721 | --- a/clang/test/Driver/opencl.cl | ||
| 7722 | +++ b/clang/test/Driver/opencl.cl | ||
| 7723 | @@ -2,6 +2,7 @@ | ||
| 7724 | // RUN: %clang -S -### -cl-std=CL1.1 %s 2>&1 | FileCheck --check-prefix=CHECK-CL11 %s | ||
| 7725 | // RUN: %clang -S -### -cl-std=CL1.2 %s 2>&1 | FileCheck --check-prefix=CHECK-CL12 %s | ||
| 7726 | // RUN: %clang -S -### -cl-std=CL2.0 %s 2>&1 | FileCheck --check-prefix=CHECK-CL20 %s | ||
| 7727 | +// RUN: %clang -S -### -cl-std=CL3.0 %s 2>&1 | FileCheck --check-prefix=CHECK-CL30 %s | ||
| 7728 | // RUN: %clang -S -### -cl-std=clc++ %s 2>&1 | FileCheck --check-prefix=CHECK-CLCPP %s | ||
| 7729 | // RUN: %clang -S -### -cl-opt-disable %s 2>&1 | FileCheck --check-prefix=CHECK-OPT-DISABLE %s | ||
| 7730 | // RUN: %clang -S -### -cl-strict-aliasing %s 2>&1 | FileCheck --check-prefix=CHECK-STRICT-ALIASING %s | ||
| 7731 | @@ -22,6 +23,7 @@ | ||
| 7732 | // CHECK-CL11: "-cc1" {{.*}} "-cl-std=CL1.1" | ||
| 7733 | // CHECK-CL12: "-cc1" {{.*}} "-cl-std=CL1.2" | ||
| 7734 | // CHECK-CL20: "-cc1" {{.*}} "-cl-std=CL2.0" | ||
| 7735 | +// CHECK-CL30: "-cc1" {{.*}} "-cl-std=CL3.0" | ||
| 7736 | // CHECK-CLCPP: "-cc1" {{.*}} "-cl-std=clc++" | ||
| 7737 | // CHECK-OPT-DISABLE: "-cc1" {{.*}} "-cl-opt-disable" | ||
| 7738 | // CHECK-STRICT-ALIASING: "-cc1" {{.*}} "-cl-strict-aliasing" | ||
| 7739 | diff --git a/clang/test/Driver/unknown-std.cl b/clang/test/Driver/unknown-std.cl | ||
| 7740 | index 6f371bac13ac..00209fb62556 100644 | ||
| 7741 | --- a/clang/test/Driver/unknown-std.cl | ||
| 7742 | +++ b/clang/test/Driver/unknown-std.cl | ||
| 7743 | @@ -10,6 +10,7 @@ | ||
| 7744 | // CHECK-NEXT: note: use 'cl1.1' for 'OpenCL 1.1' standard | ||
| 7745 | // CHECK-NEXT: note: use 'cl1.2' for 'OpenCL 1.2' standard | ||
| 7746 | // CHECK-NEXT: note: use 'cl2.0' for 'OpenCL 2.0' standard | ||
| 7747 | +// CHECK-NEXT: note: use 'cl3.0' for 'OpenCL 3.0' standard | ||
| 7748 | // CHECK-NEXT: note: use 'clc++' for 'C++ for OpenCL' standard | ||
| 7749 | |||
| 7750 | // Make sure that no other output is present. | ||
| 7751 | diff --git a/clang/test/Frontend/stdlang.c b/clang/test/Frontend/stdlang.c | ||
| 7752 | index 51484999e37a..eac4632fbdd6 100644 | ||
| 7753 | --- a/clang/test/Frontend/stdlang.c | ||
| 7754 | +++ b/clang/test/Frontend/stdlang.c | ||
| 7755 | @@ -9,6 +9,7 @@ | ||
| 7756 | // RUN: %clang_cc1 -x cl -cl-std=CL1.1 -DOPENCL %s | ||
| 7757 | // RUN: %clang_cc1 -x cl -cl-std=CL1.2 -DOPENCL %s | ||
| 7758 | // RUN: %clang_cc1 -x cl -cl-std=CL2.0 -DOPENCL %s | ||
| 7759 | +// RUN: %clang_cc1 -x cl -cl-std=CL3.0 -DOPENCL %s | ||
| 7760 | // RUN: %clang_cc1 -x cl -cl-std=CLC++ -DOPENCL %s | ||
| 7761 | // RUN: not %clang_cc1 -x cl -std=c99 -DOPENCL %s 2>&1 | FileCheck --check-prefix=CHECK-C99 %s | ||
| 7762 | // RUN: not %clang_cc1 -x cl -cl-std=invalid -DOPENCL %s 2>&1 | FileCheck --check-prefix=CHECK-INVALID %s | ||
| 7763 | diff --git a/clang/test/Headers/opencl-c-header.cl b/clang/test/Headers/opencl-c-header.cl | ||
| 7764 | index 1b151ffdd16a..2716076acdcf 100644 | ||
| 7765 | --- a/clang/test/Headers/opencl-c-header.cl | ||
| 7766 | +++ b/clang/test/Headers/opencl-c-header.cl | ||
| 7767 | @@ -1,6 +1,7 @@ | ||
| 7768 | // RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify | FileCheck %s | ||
| 7769 | // RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify -cl-std=CL1.1 | FileCheck %s | ||
| 7770 | // RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify -cl-std=CL1.2 | FileCheck %s | ||
| 7771 | +// RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify -cl-std=CL3.0 | FileCheck %s | ||
| 7772 | // RUN: %clang_cc1 -O0 -triple spir-unknown-unknown -internal-isystem ../../lib/Headers -include opencl-c.h -emit-llvm -o - %s -verify -cl-std=clc++ | FileCheck %s --check-prefix=CHECK20 | ||
| 7773 | |||
| 7774 | // Test including the default header as a module. | ||
| 7775 | @@ -39,9 +40,11 @@ | ||
| 7776 | // RUN: rm -rf %t | ||
| 7777 | // RUN: mkdir -p %t | ||
| 7778 | // RUN: %clang_cc1 -triple spir64-unknown-unknown -emit-llvm -o - -cl-std=CL1.2 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK --check-prefix=CHECK-MOD %s | ||
| 7779 | +// RUN: %clang_cc1 -triple spir64-unknown-unknown -emit-llvm -o - -cl-std=CL3.0 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK --check-prefix=CHECK-MOD %s | ||
| 7780 | // RUN: %clang_cc1 -triple amdgcn--amdhsa -O0 -emit-llvm -o - -cl-std=CL2.0 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK20 --check-prefix=CHECK-MOD %s | ||
| 7781 | // RUN: chmod u-w %t | ||
| 7782 | // RUN: %clang_cc1 -triple spir64-unknown-unknown -emit-llvm -o - -cl-std=CL1.2 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK --check-prefix=CHECK-MOD %s | ||
| 7783 | +// RUN: %clang_cc1 -triple spir64-unknown-unknown -emit-llvm -o - -cl-std=CL3.0 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK --check-prefix=CHECK-MOD %s | ||
| 7784 | // RUN: %clang_cc1 -triple amdgcn--amdhsa -O0 -emit-llvm -o - -cl-std=CL2.0 -finclude-default-header -fmodules -fimplicit-module-maps -fmodules-cache-path=%t -ftime-report %s 2>&1 | FileCheck --check-prefix=CHECK20 --check-prefix=CHECK-MOD %s | ||
| 7785 | // RUN: chmod u+w %t | ||
| 7786 | |||
| 7787 | @@ -67,7 +70,7 @@ char f(char x) { | ||
| 7788 | // from OpenCL 2.0 onwards. | ||
| 7789 | |||
| 7790 | // CHECK20: _Z12write_imagef14ocl_image3d_wo | ||
| 7791 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 7792 | +#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 7793 | void test_image3dwo(write_only image3d_t img) { | ||
| 7794 | write_imagef(img, (0), (0.0f)); | ||
| 7795 | } | ||
| 7796 | @@ -81,7 +84,7 @@ void test_atomics(__generic volatile unsigned int* a) { | ||
| 7797 | #endif | ||
| 7798 | |||
| 7799 | // Verify that ATOMIC_VAR_INIT is defined. | ||
| 7800 | -#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 7801 | +#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 7802 | global atomic_int z = ATOMIC_VAR_INIT(99); | ||
| 7803 | #endif //__OPENCL_C_VERSION__ | ||
| 7804 | |||
| 7805 | diff --git a/clang/test/Index/pipe-size.cl b/clang/test/Index/pipe-size.cl | ||
| 7806 | index 94a1255f0a48..59b76051eda1 100644 | ||
| 7807 | --- a/clang/test/Index/pipe-size.cl | ||
| 7808 | +++ b/clang/test/Index/pipe-size.cl | ||
| 7809 | @@ -2,6 +2,13 @@ | ||
| 7810 | // RUN: %clang_cc1 -x cl -O0 -cl-std=CL2.0 -emit-llvm -triple spir-unknown-unknown %s -o - | FileCheck %s --check-prefix=SPIR | ||
| 7811 | // RUN: %clang_cc1 -x cl -O0 -cl-std=CL2.0 -emit-llvm -triple spir64-unknown-unknown %s -o - | FileCheck %s --check-prefix=SPIR64 | ||
| 7812 | // RUN: %clang_cc1 -x cl -O0 -cl-std=CL2.0 -emit-llvm -triple amdgcn-amd-amdhsa %s -o - | FileCheck %s --check-prefix=AMDGCN | ||
| 7813 | +// RUN: %clang_cc1 -x cl -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -emit-llvm -triple x86_64-unknown-linux-gnu %s -o - | FileCheck %s --check-prefix=X86 | ||
| 7814 | +// RUN: %clang_cc1 -x cl -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -emit-llvm -triple spir-unknown-unknown %s -o - | FileCheck %s --check-prefix=SPIR | ||
| 7815 | +// RUN: %clang_cc1 -x cl -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -emit-llvm -triple spir64-unknown-unknown %s -o - | FileCheck %s --check-prefix=SPIR64 | ||
| 7816 | +// RUN: %clang_cc1 -x cl -O0 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -emit-llvm -triple amdgcn-amd-amdhsa %s -o - | FileCheck %s --check-prefix=AMDGCN | ||
| 7817 | + | ||
| 7818 | + | ||
| 7819 | + | ||
| 7820 | __kernel void testPipe( pipe int test ) | ||
| 7821 | { | ||
| 7822 | int s = sizeof(test); | ||
| 7823 | diff --git a/clang/test/Preprocessor/init-aarch64.c b/clang/test/Preprocessor/init-aarch64.c | ||
| 7824 | index df2a6128989b..cbb0995b48b0 100644 | ||
| 7825 | --- a/clang/test/Preprocessor/init-aarch64.c | ||
| 7826 | +++ b/clang/test/Preprocessor/init-aarch64.c | ||
| 7827 | @@ -109,12 +109,12 @@ | ||
| 7828 | // AARCH64-NEXT: #define __GCC_HAVE_SYNC_COMPARE_AND_SWAP_8 1 | ||
| 7829 | // AARCH64_CXX-NEXT: #define __GLIBCXX_BITSIZE_INT_N_0 128 | ||
| 7830 | // AARCH64_CXX-NEXT: #define __GLIBCXX_TYPE_INT_N_0 __int128 | ||
| 7831 | -// AARCH64-NEXT: #define __INT16_C_SUFFIX__ | ||
| 7832 | +// AARCH64-NEXT: #define __INT16_C_SUFFIX__ | ||
| 7833 | // AARCH64-NEXT: #define __INT16_FMTd__ "hd" | ||
| 7834 | // AARCH64-NEXT: #define __INT16_FMTi__ "hi" | ||
| 7835 | // AARCH64-NEXT: #define __INT16_MAX__ 32767 | ||
| 7836 | // AARCH64-NEXT: #define __INT16_TYPE__ short | ||
| 7837 | -// AARCH64-NEXT: #define __INT32_C_SUFFIX__ | ||
| 7838 | +// AARCH64-NEXT: #define __INT32_C_SUFFIX__ | ||
| 7839 | // AARCH64-NEXT: #define __INT32_FMTd__ "d" | ||
| 7840 | // AARCH64-NEXT: #define __INT32_FMTi__ "i" | ||
| 7841 | // AARCH64-NEXT: #define __INT32_MAX__ 2147483647 | ||
| 7842 | @@ -124,7 +124,7 @@ | ||
| 7843 | // AARCH64-NEXT: #define __INT64_FMTi__ "li" | ||
| 7844 | // AARCH64-NEXT: #define __INT64_MAX__ 9223372036854775807L | ||
| 7845 | // AARCH64-NEXT: #define __INT64_TYPE__ long int | ||
| 7846 | -// AARCH64-NEXT: #define __INT8_C_SUFFIX__ | ||
| 7847 | +// AARCH64-NEXT: #define __INT8_C_SUFFIX__ | ||
| 7848 | // AARCH64-NEXT: #define __INT8_FMTd__ "hhd" | ||
| 7849 | // AARCH64-NEXT: #define __INT8_FMTi__ "hhi" | ||
| 7850 | // AARCH64-NEXT: #define __INT8_MAX__ 127 | ||
| 7851 | @@ -238,7 +238,7 @@ | ||
| 7852 | // AARCH64-NEXT: #define __STDC_UTF_32__ 1 | ||
| 7853 | // AARCH64_C: #define __STDC_VERSION__ 201710L | ||
| 7854 | // AARCH64-NEXT: #define __STDC__ 1 | ||
| 7855 | -// AARCH64-NEXT: #define __UINT16_C_SUFFIX__ | ||
| 7856 | +// AARCH64-NEXT: #define __UINT16_C_SUFFIX__ | ||
| 7857 | // AARCH64-NEXT: #define __UINT16_FMTX__ "hX" | ||
| 7858 | // AARCH64-NEXT: #define __UINT16_FMTo__ "ho" | ||
| 7859 | // AARCH64-NEXT: #define __UINT16_FMTu__ "hu" | ||
| 7860 | @@ -259,7 +259,7 @@ | ||
| 7861 | // AARCH64-NEXT: #define __UINT64_FMTx__ "lx" | ||
| 7862 | // AARCH64-NEXT: #define __UINT64_MAX__ 18446744073709551615UL | ||
| 7863 | // AARCH64-NEXT: #define __UINT64_TYPE__ long unsigned int | ||
| 7864 | -// AARCH64-NEXT: #define __UINT8_C_SUFFIX__ | ||
| 7865 | +// AARCH64-NEXT: #define __UINT8_C_SUFFIX__ | ||
| 7866 | // AARCH64-NEXT: #define __UINT8_FMTX__ "hhX" | ||
| 7867 | // AARCH64-NEXT: #define __UINT8_FMTo__ "hho" | ||
| 7868 | // AARCH64-NEXT: #define __UINT8_FMTu__ "hhu" | ||
| 7869 | @@ -329,7 +329,7 @@ | ||
| 7870 | // AARCH64-NEXT: #define __UINT_LEAST8_FMTx__ "hhx" | ||
| 7871 | // AARCH64-NEXT: #define __UINT_LEAST8_MAX__ 255 | ||
| 7872 | // AARCH64-NEXT: #define __UINT_LEAST8_TYPE__ unsigned char | ||
| 7873 | -// AARCH64-NEXT: #define __USER_LABEL_PREFIX__ | ||
| 7874 | +// AARCH64-NEXT: #define __USER_LABEL_PREFIX__ | ||
| 7875 | // AARCH64-NEXT: #define __VERSION__ "{{.*}}" | ||
| 7876 | // AARCH64-NEXT: #define __WCHAR_MAX__ 4294967295U | ||
| 7877 | // AARCH64-NEXT: #define __WCHAR_TYPE__ unsigned int | ||
| 7878 | diff --git a/clang/test/Preprocessor/predefined-macros.c b/clang/test/Preprocessor/predefined-macros.c | ||
| 7879 | index 083f0e539d88..6c80517ec4d4 100644 | ||
| 7880 | --- a/clang/test/Preprocessor/predefined-macros.c | ||
| 7881 | +++ b/clang/test/Preprocessor/predefined-macros.c | ||
| 7882 | @@ -129,6 +129,8 @@ | ||
| 7883 | // RUN: | FileCheck -match-full-lines %s --check-prefix=CHECK-CL12 | ||
| 7884 | // RUN: %clang_cc1 %s -E -dM -o - -x cl -cl-std=CL2.0 \ | ||
| 7885 | // RUN: | FileCheck -match-full-lines %s --check-prefix=CHECK-CL20 | ||
| 7886 | +// RUN: %clang_cc1 %s -E -dM -o - -x cl -cl-std=CL3.0 \ | ||
| 7887 | +// RUN: | FileCheck -match-full-lines %s --check-prefix=CHECK-CL30 | ||
| 7888 | // RUN: %clang_cc1 %s -E -dM -o - -x cl -cl-fast-relaxed-math \ | ||
| 7889 | // RUN: | FileCheck -match-full-lines %s --check-prefix=CHECK-FRM | ||
| 7890 | // RUN: %clang_cc1 %s -E -dM -o - -x cl -cl-std=clc++ \ | ||
| 7891 | @@ -137,26 +139,37 @@ | ||
| 7892 | // CHECK-CL10: #define CL_VERSION_1_1 110 | ||
| 7893 | // CHECK-CL10: #define CL_VERSION_1_2 120 | ||
| 7894 | // CHECK-CL10: #define CL_VERSION_2_0 200 | ||
| 7895 | +// CHECK-CL10: #define CL_VERSION_3_0 300 | ||
| 7896 | // CHECK-CL10: #define __OPENCL_C_VERSION__ 100 | ||
| 7897 | // CHECK-CL10-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7898 | // CHECK-CL11: #define CL_VERSION_1_0 100 | ||
| 7899 | // CHECK-CL11: #define CL_VERSION_1_1 110 | ||
| 7900 | // CHECK-CL11: #define CL_VERSION_1_2 120 | ||
| 7901 | // CHECK-CL11: #define CL_VERSION_2_0 200 | ||
| 7902 | +// CHECK-CL11: #define CL_VERSION_3_0 300 | ||
| 7903 | // CHECK-CL11: #define __OPENCL_C_VERSION__ 110 | ||
| 7904 | // CHECK-CL11-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7905 | // CHECK-CL12: #define CL_VERSION_1_0 100 | ||
| 7906 | // CHECK-CL12: #define CL_VERSION_1_1 110 | ||
| 7907 | // CHECK-CL12: #define CL_VERSION_1_2 120 | ||
| 7908 | // CHECK-CL12: #define CL_VERSION_2_0 200 | ||
| 7909 | +// CHECK-CL12: #define CL_VERSION_3_0 300 | ||
| 7910 | // CHECK-CL12: #define __OPENCL_C_VERSION__ 120 | ||
| 7911 | // CHECK-CL12-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7912 | // CHECK-CL20: #define CL_VERSION_1_0 100 | ||
| 7913 | // CHECK-CL20: #define CL_VERSION_1_1 110 | ||
| 7914 | // CHECK-CL20: #define CL_VERSION_1_2 120 | ||
| 7915 | // CHECK-CL20: #define CL_VERSION_2_0 200 | ||
| 7916 | +// CHECK-CL20: #define CL_VERSION_3_0 300 | ||
| 7917 | // CHECK-CL20: #define __OPENCL_C_VERSION__ 200 | ||
| 7918 | // CHECK-CL20-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7919 | +// CHECK-CL30: #define CL_VERSION_1_0 100 | ||
| 7920 | +// CHECK-CL30: #define CL_VERSION_1_1 110 | ||
| 7921 | +// CHECK-CL30: #define CL_VERSION_1_2 120 | ||
| 7922 | +// CHECK-CL30: #define CL_VERSION_2_0 200 | ||
| 7923 | +// CHECK-CL30: #define CL_VERSION_3_0 300 | ||
| 7924 | +// CHECK-CL30: #define __OPENCL_C_VERSION__ 300 | ||
| 7925 | +// CHECK-CL30-NOT: #define __FAST_RELAXED_MATH__ 1 | ||
| 7926 | // CHECK-FRM: #define __FAST_RELAXED_MATH__ 1 | ||
| 7927 | // CHECK-CLCPP10: #define __CL_CPP_VERSION_1_0__ 100 | ||
| 7928 | // CHECK-CLCPP10: #define __OPENCL_CPP_VERSION__ 100 | ||
| 7929 | diff --git a/clang/test/Sema/feature-extensions-simult-support.cl b/clang/test/Sema/feature-extensions-simult-support.cl | ||
| 7930 | new file mode 100644 | ||
| 7931 | index 000000000000..0789105002b2 | ||
| 7932 | --- /dev/null | ||
| 7933 | +++ b/clang/test/Sema/feature-extensions-simult-support.cl | ||
| 7934 | @@ -0,0 +1,75 @@ | ||
| 7935 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=-cl_khr_fp64 | ||
| 7936 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=+cl_khr_fp64 | ||
| 7937 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=-cl_khr_3d_image_writes | ||
| 7938 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=+cl_khr_3d_image_writes | ||
| 7939 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=-cl_khr_subgroups | ||
| 7940 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 -cl-ext=+cl_khr_subgroups | ||
| 7941 | + | ||
| 7942 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=-cl_khr_fp64 | ||
| 7943 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=+cl_khr_fp64 | ||
| 7944 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=-cl_khr_3d_image_writes | ||
| 7945 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=+cl_khr_3d_image_writes | ||
| 7946 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=-cl_khr_subgroups | ||
| 7947 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=+cl_khr_subgroups | ||
| 7948 | + | ||
| 7949 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_fp64 | ||
| 7950 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_3d_image_writes | ||
| 7951 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_subgroups | ||
| 7952 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_pipes | ||
| 7953 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_device_enqueue | ||
| 7954 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_read_write_images | ||
| 7955 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_fp64,-cl_khr_fp64 | ||
| 7956 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_3d_image_writes,-cl_khr_3d_image_writes | ||
| 7957 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+__opencl_c_subgroups,-cl_khr_subgroups | ||
| 7958 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+cl_khr_fp64 | ||
| 7959 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+cl_khr_3d_image_writes | ||
| 7960 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=+cl_khr_subgroups | ||
| 7961 | + | ||
| 7962 | +// expected-no-diagnostics | ||
| 7963 | + | ||
| 7964 | +#ifdef cl_khr_fp64 | ||
| 7965 | + #ifndef __opencl_c_fp64 | ||
| 7966 | + #error macros were not properly set up | ||
| 7967 | + #endif | ||
| 7968 | +#endif | ||
| 7969 | +#ifdef __opencl_c_fp64 | ||
| 7970 | + #ifndef cl_khr_fp64 | ||
| 7971 | + #error macros were not properly set up | ||
| 7972 | + #endif | ||
| 7973 | +#endif | ||
| 7974 | + | ||
| 7975 | +#ifdef cl_khr_3d_image_writes | ||
| 7976 | + #ifndef __opencl_c_3d_image_writes | ||
| 7977 | + #error macros were not properly set up | ||
| 7978 | + #endif | ||
| 7979 | +#endif | ||
| 7980 | +#ifdef __opencl_c_3d_image_writes | ||
| 7981 | + #ifndef cl_khr_3d_image_writes | ||
| 7982 | + #error macros were not properly set up | ||
| 7983 | + #endif | ||
| 7984 | +#endif | ||
| 7985 | + | ||
| 7986 | +#ifdef cl_khr_subgroups | ||
| 7987 | + #ifndef __opencl_c_subgroups | ||
| 7988 | + #error macros were not properly set up | ||
| 7989 | + #endif | ||
| 7990 | +#endif | ||
| 7991 | +#ifdef __opencl_c_subgroups | ||
| 7992 | + #ifndef cl_khr_subgroups | ||
| 7993 | + #error macros were not properly set up | ||
| 7994 | + #endif | ||
| 7995 | +#endif | ||
| 7996 | + | ||
| 7997 | +#if defined(__opencl_c_pipes) || defined(__opencl_c_device_enqueue) | ||
| 7998 | + #ifndef __opencl_c_generic_address_space | ||
| 7999 | + #error macros were not properly set up | ||
| 8000 | + #endif | ||
| 8001 | +#endif | ||
| 8002 | + | ||
| 8003 | +#if defined(__opencl_c_3d_image_writes) || defined(__opencl_c_read_write_images) | ||
| 8004 | + #ifndef __opencl_c_images | ||
| 8005 | + #error macros were not properly set up | ||
| 8006 | + #endif | ||
| 8007 | +#endif | ||
| 8008 | + | ||
| 8009 | +kernel void test(){} | ||
| 8010 | diff --git a/clang/test/Sema/features-ignore-pragma.cl b/clang/test/Sema/features-ignore-pragma.cl | ||
| 8011 | new file mode 100644 | ||
| 8012 | index 000000000000..046ce5390754 | ||
| 8013 | --- /dev/null | ||
| 8014 | +++ b/clang/test/Sema/features-ignore-pragma.cl | ||
| 8015 | @@ -0,0 +1,24 @@ | ||
| 8016 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 | ||
| 8017 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_fp64 | ||
| 8018 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_subgroups | ||
| 8019 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_3d_image_writes | ||
| 8020 | + | ||
| 8021 | +#pragma OPENCL EXTENSION __opencl_c_fp64 : enable | ||
| 8022 | +// expected-warning@-1 {{OpenCL feature support can't be controlled via pragma, ignoring}} | ||
| 8023 | + | ||
| 8024 | +#pragma OPENCL EXTENSION cl_khr_fp64 : enable | ||
| 8025 | +#ifndef __opencl_c_fp64 | ||
| 8026 | +// expected-warning@-2{{unsupported OpenCL extension 'cl_khr_fp64' - ignoring}} | ||
| 8027 | +#endif | ||
| 8028 | + | ||
| 8029 | +#pragma OPENCL EXTENSION cl_khr_subgroups : enable | ||
| 8030 | +#ifndef __opencl_c_subgroups | ||
| 8031 | +// expected-warning@-2{{unsupported OpenCL extension 'cl_khr_subgroups' - ignoring}} | ||
| 8032 | +#endif | ||
| 8033 | + | ||
| 8034 | +#pragma OPENCL EXTENSION cl_khr_3d_image_writes : enable | ||
| 8035 | +#ifndef __opencl_c_3d_image_writes | ||
| 8036 | +// expected-warning@-2{{unsupported OpenCL extension 'cl_khr_3d_image_writes' - ignoring}} | ||
| 8037 | +#endif | ||
| 8038 | + | ||
| 8039 | +kernel void foo() {} | ||
| 8040 | diff --git a/clang/test/Sema/opencl-features-pipes.cl b/clang/test/Sema/opencl-features-pipes.cl | ||
| 8041 | new file mode 100644 | ||
| 8042 | index 000000000000..c0ac778f24a6 | ||
| 8043 | --- /dev/null | ||
| 8044 | +++ b/clang/test/Sema/opencl-features-pipes.cl | ||
| 8045 | @@ -0,0 +1,18 @@ | ||
| 8046 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.1 | ||
| 8047 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL1.2 | ||
| 8048 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -DHAS | ||
| 8049 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 | ||
| 8050 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -DHAS | ||
| 8051 | +// expected-no-diagnostics | ||
| 8052 | + | ||
| 8053 | +#ifdef HAS | ||
| 8054 | + #ifndef __opencl_c_pipes | ||
| 8055 | + #error Feature should be defined | ||
| 8056 | + #endif | ||
| 8057 | +#else | ||
| 8058 | + #ifdef __opencl_c_pipes | ||
| 8059 | + #error Feature should not be defined | ||
| 8060 | + #endif | ||
| 8061 | +#endif | ||
| 8062 | + | ||
| 8063 | +kernel void foo() {} | ||
| 8064 | diff --git a/clang/test/Sema/opencl-features.cl b/clang/test/Sema/opencl-features.cl | ||
| 8065 | new file mode 100644 | ||
| 8066 | index 000000000000..aa432f6b60bf | ||
| 8067 | --- /dev/null | ||
| 8068 | +++ b/clang/test/Sema/opencl-features.cl | ||
| 8069 | @@ -0,0 +1,128 @@ | ||
| 8070 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 | ||
| 8071 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=-__opencl_c_device_enqueue,-__opencl_c_pipes,-__opencl_c_read_write_images | ||
| 8072 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CLC++ | ||
| 8073 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 | ||
| 8074 | +// expected-no-diagnostics | ||
| 8075 | + | ||
| 8076 | +#ifndef __opencl_c_int64 | ||
| 8077 | + #error Feature __opencl_c_int64 shouldn't be defined | ||
| 8078 | +#endif | ||
| 8079 | + | ||
| 8080 | +#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ == CL_VERSION_2_0) | ||
| 8081 | + #ifndef __opencl_c_3d_image_writes | ||
| 8082 | + #error Feature __opencl_c_3d_image_writes should be defined | ||
| 8083 | + #endif | ||
| 8084 | + | ||
| 8085 | + #ifndef __opencl_c_atomic_order_acq_rel | ||
| 8086 | + #error Feature __opencl_c_atomic_order_acq_rel should be defined | ||
| 8087 | + #endif | ||
| 8088 | + | ||
| 8089 | + #ifndef __opencl_c_atomic_order_seq_cst | ||
| 8090 | + #error Feature __opencl_c_atomic_order_seq_cst should be defined | ||
| 8091 | + #endif | ||
| 8092 | + | ||
| 8093 | + #ifndef __opencl_c_atomic_scope_device | ||
| 8094 | + #error Feature __opencl_c_atomic_scope_device should be defined | ||
| 8095 | + #endif | ||
| 8096 | + | ||
| 8097 | + #ifndef __opencl_c_atomic_scope_all_devices | ||
| 8098 | + #error Feature __opencl_c_atomic_scope_all_devices should be defined | ||
| 8099 | + #endif | ||
| 8100 | + | ||
| 8101 | + #ifndef __opencl_c_device_enqueue | ||
| 8102 | + #error Feature __opencl_c_device_enqueue should be defined | ||
| 8103 | + #endif | ||
| 8104 | + | ||
| 8105 | + #ifndef __opencl_c_generic_address_space | ||
| 8106 | + #error Feature __opencl_c_generic_address_space should be defined | ||
| 8107 | + #endif | ||
| 8108 | + | ||
| 8109 | + #ifndef __opencl_c_pipes | ||
| 8110 | + #error Feature __opencl_c_pipes should be defined | ||
| 8111 | + #endif | ||
| 8112 | + | ||
| 8113 | + #ifndef __opencl_c_program_scope_global_variables | ||
| 8114 | + #error Feature __opencl_c_program_scope_global_variables should be defined | ||
| 8115 | + #endif | ||
| 8116 | + | ||
| 8117 | + #ifndef __opencl_c_read_write_images | ||
| 8118 | + #error Feature __opencl_c_read_write_images should be defined | ||
| 8119 | + #endif | ||
| 8120 | + | ||
| 8121 | + #ifndef __opencl_c_subgroups | ||
| 8122 | + #error Feature __opencl_c_subgroups should be defined | ||
| 8123 | + #endif | ||
| 8124 | + | ||
| 8125 | + #ifndef __opencl_c_work_group_collective_functions | ||
| 8126 | + #error Feature __opencl_c_work_group_collective_functions should be defined | ||
| 8127 | + #endif | ||
| 8128 | + | ||
| 8129 | + #ifndef __opencl_c_fp64 | ||
| 8130 | + #error Feature __opencl_c_fp64 should be defined | ||
| 8131 | + #endif | ||
| 8132 | + | ||
| 8133 | + #ifndef __opencl_c_images | ||
| 8134 | + #error Feature __opencl_c_images should be defined | ||
| 8135 | + #endif | ||
| 8136 | +#endif // defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0) | ||
| 8137 | + | ||
| 8138 | + | ||
| 8139 | +#if __OPENCL_C_VERSION__ == CL_VERSION_3_0 | ||
| 8140 | + #ifdef __opencl_c_3d_image_writes | ||
| 8141 | + #error Feature __opencl_c_3d_image_writes shouldn't be defined | ||
| 8142 | + #endif | ||
| 8143 | + | ||
| 8144 | + #ifdef __opencl_c_atomic_order_acq_rel | ||
| 8145 | + #error Feature __opencl_c_atomic_order_acq_rel shouldn't be defined | ||
| 8146 | + #endif | ||
| 8147 | + | ||
| 8148 | + #ifdef __opencl_c_atomic_order_seq_cst | ||
| 8149 | + #error Feature __opencl_c_atomic_order_seq_cst shouldn't be defined | ||
| 8150 | + #endif | ||
| 8151 | + | ||
| 8152 | + #ifdef __opencl_c_atomic_scope_device | ||
| 8153 | + #error Feature __opencl_c_atomic_scope_device shouldn't be defined | ||
| 8154 | + #endif | ||
| 8155 | + | ||
| 8156 | + #ifdef __opencl_c_atomic_scope_all_devices | ||
| 8157 | + #error Feature __opencl_c_atomic_scope_all_devices shouldn't be defined | ||
| 8158 | + #endif | ||
| 8159 | + | ||
| 8160 | + #ifdef __opencl_c_device_enqueue | ||
| 8161 | + #error Feature __opencl_c_device_enqueue shouldn't be defined | ||
| 8162 | + #endif | ||
| 8163 | + | ||
| 8164 | + #ifdef __opencl_c_generic_address_space | ||
| 8165 | + #error Feature __opencl_c_generic_address_space shouldn't be defined | ||
| 8166 | + #endif | ||
| 8167 | + | ||
| 8168 | + #ifdef __opencl_c_pipes | ||
| 8169 | + #error Feature __opencl_c_pipes shouldn't be defined | ||
| 8170 | + #endif | ||
| 8171 | + | ||
| 8172 | + #ifdef __opencl_c_program_scope_global_variables | ||
| 8173 | + #error Feature __opencl_c_program_scope_global_variables shouldn't be defined | ||
| 8174 | + #endif | ||
| 8175 | + | ||
| 8176 | + #ifdef __opencl_c_read_write_images | ||
| 8177 | + #error Feature __opencl_c_read_write_images shouldn't be defined | ||
| 8178 | + #endif | ||
| 8179 | + | ||
| 8180 | + #ifdef __opencl_c_subgroups | ||
| 8181 | + #error Feature __opencl_c_subgroups shouldn't be defined | ||
| 8182 | + #endif | ||
| 8183 | + | ||
| 8184 | + #ifdef __opencl_c_work_group_collective_functions | ||
| 8185 | + #error Feature __opencl_c_work_group_collective_functions shouldn't be defined | ||
| 8186 | + #endif | ||
| 8187 | + | ||
| 8188 | + #ifdef __opencl_c_fp64 | ||
| 8189 | + #error Feature __opencl_c_fp64 shouldn't be defined | ||
| 8190 | + #endif | ||
| 8191 | + | ||
| 8192 | + #ifdef __opencl_c_images | ||
| 8193 | + #error Feature __opencl_c_images shouldn't be defined | ||
| 8194 | + #endif | ||
| 8195 | +#endif // __OPENCL_C_VERSION__ == CL_VERSION_3_0 | ||
| 8196 | + | ||
| 8197 | +kernel void foo() {} | ||
| 8198 | diff --git a/clang/test/Sema/pipe_builtins_feature.cl b/clang/test/Sema/pipe_builtins_feature.cl | ||
| 8199 | new file mode 100644 | ||
| 8200 | index 000000000000..56fa94fc7705 | ||
| 8201 | --- /dev/null | ||
| 8202 | +++ b/clang/test/Sema/pipe_builtins_feature.cl | ||
| 8203 | @@ -0,0 +1,21 @@ | ||
| 8204 | +// RUN: %clang_cc1 -cl-std=CL2.0 -fsyntax-only -verify %s | ||
| 8205 | +// RUN: %clang_cc1 -cl-std=CL3.0 -fsyntax-only -verify %s | ||
| 8206 | +// RUN: %clang_cc1 -cl-std=CL3.0 -cl-ext=__opencl_c_pipes -fsyntax-only -verify %s | ||
| 8207 | + | ||
| 8208 | +#ifdef __opencl_c_pipes | ||
| 8209 | + #ifndef __opencl_c_generic_address_space | ||
| 8210 | + #error Generic address space feature must also be defined | ||
| 8211 | + #endif | ||
| 8212 | +// CHECK: expected-no-diagnostics | ||
| 8213 | +// check that pragma disable all doesn't touch feature support | ||
| 8214 | + #pragma OPENCL EXTENSION all : disable | ||
| 8215 | +#endif | ||
| 8216 | + | ||
| 8217 | +void test(read_only pipe int p, global int *ptr) { | ||
| 8218 | + reserve_id_t rid; | ||
| 8219 | +} | ||
| 8220 | + | ||
| 8221 | +#ifndef __opencl_c_pipes | ||
| 8222 | +// expected-error@-5 {{expected parameter declarator}} expected-error@-5 {{expected ')'}} expected-note@-5 {{to match this '('}} | ||
| 8223 | +// expected-error@-5 {{use of type 'reserve_id_t' requires __opencl_c_pipes extension to be enabled}} | ||
| 8224 | +#endif | ||
| 8225 | diff --git a/clang/test/SemaOpenCL/address-spaces-conversions-cl2.0.cl b/clang/test/SemaOpenCL/address-spaces-conversions-cl2.0.cl | ||
| 8226 | index a5a838241347..dbdc5cffd073 100644 | ||
| 8227 | --- a/clang/test/SemaOpenCL/address-spaces-conversions-cl2.0.cl | ||
| 8228 | +++ b/clang/test/SemaOpenCL/address-spaces-conversions-cl2.0.cl | ||
| 8229 | @@ -1,6 +1,9 @@ | ||
| 8230 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DCONSTANT -cl-std=CL2.0 | ||
| 8231 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGLOBAL -cl-std=CL2.0 | ||
| 8232 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGENERIC -cl-std=CL2.0 | ||
| 8233 | +// RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DCONSTANT -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space | ||
| 8234 | +// RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGLOBAL -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space | ||
| 8235 | +// RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGENERIC -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space | ||
| 8236 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DCONSTANT -cl-std=clc++ | ||
| 8237 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGLOBAL -cl-std=clc++ | ||
| 8238 | // RUN: %clang_cc1 %s -ffake-address-space-map -verify -pedantic -fsyntax-only -DGENERIC -cl-std=clc++ | ||
| 8239 | diff --git a/clang/test/SemaOpenCL/address-spaces.cl b/clang/test/SemaOpenCL/address-spaces.cl | ||
| 8240 | index e9825fd1682a..563f1e649a82 100644 | ||
| 8241 | --- a/clang/test/SemaOpenCL/address-spaces.cl | ||
| 8242 | +++ b/clang/test/SemaOpenCL/address-spaces.cl | ||
| 8243 | @@ -1,5 +1,6 @@ | ||
| 8244 | // RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only | ||
| 8245 | // RUN: %clang_cc1 %s -cl-std=CL2.0 -verify -pedantic -fsyntax-only | ||
| 8246 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -cl-ext=__opencl_c_generic_address_space -verify -pedantic -fsyntax-only | ||
| 8247 | // RUN: %clang_cc1 %s -cl-std=clc++ -verify -pedantic -fsyntax-only | ||
| 8248 | |||
| 8249 | __constant int ci = 1; | ||
| 8250 | diff --git a/clang/test/SemaOpenCL/cl20-device-side-enqueue.cl b/clang/test/SemaOpenCL/cl20-device-side-enqueue.cl | ||
| 8251 | index f63e2913c749..727141190a0b 100644 | ||
| 8252 | --- a/clang/test/SemaOpenCL/cl20-device-side-enqueue.cl | ||
| 8253 | +++ b/clang/test/SemaOpenCL/cl20-device-side-enqueue.cl | ||
| 8254 | @@ -2,6 +2,12 @@ | ||
| 8255 | // RUN: %clang_cc1 %s -cl-std=CL2.0 -triple "spir-unknown-unknown" -verify -pedantic -fsyntax-only -DB32 -DQUALS="const volatile" | ||
| 8256 | // RUN: %clang_cc1 %s -cl-std=CL2.0 -triple "spir64-unknown-unknown" -verify -pedantic -fsyntax-only -Wconversion -DWCONV -DQUALS= | ||
| 8257 | // RUN: %clang_cc1 %s -cl-std=CL2.0 -triple "spir64-unknown-unknown" -verify -pedantic -fsyntax-only -Wconversion -DWCONV -DQUALS="const volatile" | ||
| 8258 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -triple "spir-unknown-unknown" -cl-ext=__opencl_c_device_enqueue,__opencl_c_subgroups -verify -pedantic -fsyntax-only -DB32 -DQUALS= | ||
| 8259 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -triple "spir-unknown-unknown" -cl-ext=__opencl_c_device_enqueue,__opencl_c_subgroups -verify -pedantic -fsyntax-only -DB32 -DQUALS="const volatile" | ||
| 8260 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -triple "spir64-unknown-unknown" -cl-ext=__opencl_c_device_enqueue,__opencl_c_subgroups -verify -pedantic -fsyntax-only -Wconversion -DWCONV -DQUALS= | ||
| 8261 | +// RUN: %clang_cc1 %s -cl-std=CL3.0 -triple "spir64-unknown-unknown" -cl-ext=__opencl_c_device_enqueue,__opencl_c_subgroups -verify -pedantic -fsyntax-only -Wconversion -DWCONV -DQUALS="const volatile" | ||
| 8262 | + | ||
| 8263 | + | ||
| 8264 | |||
| 8265 | typedef struct {int a;} ndrange_t; | ||
| 8266 | // Diagnostic tests for different overloads of enqueue_kernel from Table 6.13.17.1 of OpenCL 2.0 Spec. | ||
| 8267 | @@ -235,11 +241,17 @@ kernel void bar(global unsigned int *buf) | ||
| 8268 | kernel void foo1(global unsigned int *buf) | ||
| 8269 | { | ||
| 8270 | ndrange_t n; | ||
| 8271 | - buf[0] = get_kernel_max_sub_group_size_for_ndrange(n, ^(){}); // expected-error {{use of declaration 'get_kernel_max_sub_group_size_for_ndrange' requires cl_khr_subgroups extension to be enabled}} | ||
| 8272 | + buf[0] = get_kernel_max_sub_group_size_for_ndrange(n, ^(){}); | ||
| 8273 | +#if __OPENCL_C_VERSION__ < 300 | ||
| 8274 | +// expected-error@-2 {{use of declaration 'get_kernel_max_sub_group_size_for_ndrange' requires cl_khr_subgroups extension to be enabled}} | ||
| 8275 | +#endif | ||
| 8276 | } | ||
| 8277 | |||
| 8278 | kernel void bar1(global unsigned int *buf) | ||
| 8279 | { | ||
| 8280 | ndrange_t n; | ||
| 8281 | - buf[0] = get_kernel_sub_group_count_for_ndrange(n, ^(){}); // expected-error {{use of declaration 'get_kernel_sub_group_count_for_ndrange' requires cl_khr_subgroups extension to be enabled}} | ||
| 8282 | + buf[0] = get_kernel_sub_group_count_for_ndrange(n, ^(){}); | ||
| 8283 | +#if __OPENCL_C_VERSION__ < 300 | ||
| 8284 | +// expected-error@-2 {{use of declaration 'get_kernel_sub_group_count_for_ndrange' requires cl_khr_subgroups extension to be enabled}} | ||
| 8285 | +#endif | ||
| 8286 | } | ||
| 8287 | diff --git a/clang/test/SemaOpenCL/forget-unsupported-builtins.cl b/clang/test/SemaOpenCL/forget-unsupported-builtins.cl | ||
| 8288 | new file mode 100644 | ||
| 8289 | index 000000000000..14dd03e2c7db | ||
| 8290 | --- /dev/null | ||
| 8291 | +++ b/clang/test/SemaOpenCL/forget-unsupported-builtins.cl | ||
| 8292 | @@ -0,0 +1,22 @@ | ||
| 8293 | +// RUN: %clang_cc1 -cl-std=cl3.0 -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8294 | +// RUN: %clang_cc1 -cl-std=cl3.0 -fsyntax-only -cl-ext=__opencl_c_pipes,__opencl_c_generic_address_space,__opencl_c_device_enqueue -verify %s -triple spir-unknown-unknown -DFEATURES | ||
| 8295 | + | ||
| 8296 | +#ifndef FEATURES | ||
| 8297 | + // expected-no-diagnostics | ||
| 8298 | +#else | ||
| 8299 | + // expected-error@+10 {{cannot redeclare builtin function 'get_pipe_max_packets'}} | ||
| 8300 | + // expected-note@+9 {{'get_pipe_max_packets' is a builtin with type 'unsigned int ()'}} | ||
| 8301 | + // expected-error@+9 {{cannot redeclare builtin function 'to_local'}} | ||
| 8302 | + // expected-note@+8 {{'to_local' is a builtin with type 'void *(void *)'}} | ||
| 8303 | + // expected-error@+8 {{cannot redeclare builtin function 'to_global'}} | ||
| 8304 | + // expected-note@+7 {{'to_global' is a builtin with type 'void *(void *)'}} | ||
| 8305 | + // expected-error@+7 {{cannot redeclare builtin function 'get_kernel_work_group_size'}} | ||
| 8306 | + // expected-note@+6 {{'get_kernel_work_group_size' is a builtin with type 'unsigned int ()'}} | ||
| 8307 | +#endif | ||
| 8308 | + | ||
| 8309 | +int get_pipe_max_packets(int); | ||
| 8310 | +int to_local(int); | ||
| 8311 | +int to_global(int); | ||
| 8312 | +int get_kernel_work_group_size(int); | ||
| 8313 | + | ||
| 8314 | +kernel void test(global int *dst) {} | ||
| 8315 | diff --git a/clang/test/SemaOpenCL/image-features.cl b/clang/test/SemaOpenCL/image-features.cl | ||
| 8316 | new file mode 100644 | ||
| 8317 | index 000000000000..ace6913bb31e | ||
| 8318 | --- /dev/null | ||
| 8319 | +++ b/clang/test/SemaOpenCL/image-features.cl | ||
| 8320 | @@ -0,0 +1,20 @@ | ||
| 8321 | +// RUN: %clang_cc1 -cl-std=cl2.0 -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8322 | +// RUN: %clang_cc1 -cl-std=cl3.0 -cl-ext=__opencl_c_images -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8323 | +// RUN: %clang_cc1 -cl-std=cl3.0 -cl-ext=__opencl_c_3d_image_writes -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8324 | +// RUN: %clang_cc1 -cl-std=cl3.0 -cl-ext=__opencl_c_read_write_images -fsyntax-only -verify %s -triple spir-unknown-unknown | ||
| 8325 | + | ||
| 8326 | +#if defined(__opencl_c_read_write_images) && defined(__opencl_c_3d_image_writes) | ||
| 8327 | + // expected-no-diagnostics | ||
| 8328 | +#endif | ||
| 8329 | + | ||
| 8330 | +__kernel void write_3d_image(__write_only image3d_t i) {} | ||
| 8331 | + | ||
| 8332 | +#ifndef __opencl_c_3d_image_writes | ||
| 8333 | + // expected-error@-3 {{use of type '__write_only image3d_t' requires __opencl_c_3d_image_writes extension to be enabled}} | ||
| 8334 | +#endif | ||
| 8335 | + | ||
| 8336 | +__kernel void read_write_3d_image(__read_write image3d_t i) { } | ||
| 8337 | + | ||
| 8338 | +#ifndef __opencl_c_read_write_images | ||
| 8339 | + // expected-error@-3 {{use of type '__read_write image3d_t' requires __opencl_c_read_write_images extension to be enabled}} | ||
| 8340 | +#endif | ||
| 8341 | diff --git a/clang/test/SemaOpenCL/invalid-pipe-builtin-cl2.0.cl b/clang/test/SemaOpenCL/invalid-pipe-builtin-cl2.0.cl | ||
| 8342 | index 36e76621d24a..38b0a04726e3 100644 | ||
| 8343 | --- a/clang/test/SemaOpenCL/invalid-pipe-builtin-cl2.0.cl | ||
| 8344 | +++ b/clang/test/SemaOpenCL/invalid-pipe-builtin-cl2.0.cl | ||
| 8345 | @@ -1,4 +1,5 @@ | ||
| 8346 | // RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 -cl-ext=+cl_khr_subgroups | ||
| 8347 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_subgroups,__opencl_c_pipes | ||
| 8348 | |||
| 8349 | #pragma OPENCL EXTENSION cl_khr_subgroups : enable | ||
| 8350 | |||
| 8351 | diff --git a/clang/test/SemaOpenCL/storageclass-cl20.cl b/clang/test/SemaOpenCL/storageclass-cl20.cl | ||
| 8352 | index 581701d2a6a5..469c526ebc30 100644 | ||
| 8353 | --- a/clang/test/SemaOpenCL/storageclass-cl20.cl | ||
| 8354 | +++ b/clang/test/SemaOpenCL/storageclass-cl20.cl | ||
| 8355 | @@ -1,4 +1,5 @@ | ||
| 8356 | // RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL2.0 | ||
| 8357 | +// RUN: %clang_cc1 %s -verify -pedantic -fsyntax-only -cl-std=CL3.0 -cl-ext=__opencl_c_program_scope_global_variables,__opencl_c_generic_address_space | ||
| 8358 | |||
| 8359 | int G2 = 0; | ||
| 8360 | global int G3 = 0; | ||
| 8361 | diff --git a/clang/utils/TableGen/ClangOpenCLBuiltinEmitter.cpp b/clang/utils/TableGen/ClangOpenCLBuiltinEmitter.cpp | ||
| 8362 | index 7c63cf51ecfa..785ff93aaf85 100644 | ||
| 8363 | --- a/clang/utils/TableGen/ClangOpenCLBuiltinEmitter.cpp | ||
| 8364 | +++ b/clang/utils/TableGen/ClangOpenCLBuiltinEmitter.cpp | ||
| 8365 | @@ -56,6 +56,7 @@ | ||
| 8366 | //===----------------------------------------------------------------------===// | ||
| 8367 | |||
| 8368 | #include "TableGenBackends.h" | ||
| 8369 | +#include "clang/Basic/OpenCLOptions.h" | ||
| 8370 | #include "llvm/ADT/MapVector.h" | ||
| 8371 | #include "llvm/ADT/STLExtras.h" | ||
| 8372 | #include "llvm/ADT/SmallString.h" | ||
| 8373 | @@ -69,6 +70,7 @@ | ||
| 8374 | #include "llvm/TableGen/Record.h" | ||
| 8375 | #include "llvm/TableGen/StringMatcher.h" | ||
| 8376 | #include "llvm/TableGen/TableGenBackend.h" | ||
| 8377 | +#include <numeric> | ||
| 8378 | #include <set> | ||
| 8379 | |||
| 8380 | using namespace llvm; | ||
| 8381 | @@ -228,6 +230,10 @@ private: | ||
| 8382 | // The function "tan", having the same signatures, would be mapped to the | ||
| 8383 | // same entry (<I1, I2, I3>). | ||
| 8384 | MapVector<BuiltinIndexListTy *, BuiltinTableEntries> SignatureListMap; | ||
| 8385 | + | ||
| 8386 | + // Encode all versions | ||
| 8387 | + unsigned short | ||
| 8388 | + EncodeBuiltinVersions(std::vector<Record *> BuiltinVersionsRecords) const; | ||
| 8389 | }; | ||
| 8390 | } // namespace | ||
| 8391 | |||
| 8392 | @@ -338,12 +344,10 @@ struct OpenCLBuiltinStruct { | ||
| 8393 | const bool IsConst : 1; | ||
| 8394 | // Function attribute __attribute__((convergent)) | ||
| 8395 | const bool IsConv : 1; | ||
| 8396 | + // All opencl versions encoded | ||
| 8397 | + const unsigned char AllVersions : 5; | ||
| 8398 | // OpenCL extension(s) required for this overload. | ||
| 8399 | const unsigned short Extension; | ||
| 8400 | - // First OpenCL version in which this overload was introduced (e.g. CL20). | ||
| 8401 | - const unsigned short MinVersion; | ||
| 8402 | - // First OpenCL version in which this overload was removed (e.g. CL20). | ||
| 8403 | - const unsigned short MaxVersion; | ||
| 8404 | }; | ||
| 8405 | |||
| 8406 | )"; | ||
| 8407 | @@ -510,11 +514,9 @@ void BuiltinNameEmitter::EmitBuiltinTable() { | ||
| 8408 | << (Overload.first->getValueAsBit("IsPure")) << ", " | ||
| 8409 | << (Overload.first->getValueAsBit("IsConst")) << ", " | ||
| 8410 | << (Overload.first->getValueAsBit("IsConv")) << ", " | ||
| 8411 | - << FunctionExtensionIndex[ExtName] << ", " | ||
| 8412 | - << Overload.first->getValueAsDef("MinVersion")->getValueAsInt("ID") | ||
| 8413 | - << ", " | ||
| 8414 | - << Overload.first->getValueAsDef("MaxVersion")->getValueAsInt("ID") | ||
| 8415 | - << " },\n"; | ||
| 8416 | + << EncodeBuiltinVersions( | ||
| 8417 | + Overload.first->getValueAsListOfDefs("Versions")) | ||
| 8418 | + << ", " << FunctionExtensionIndex[ExtName] << " },\n"; | ||
| 8419 | Index++; | ||
| 8420 | } | ||
| 8421 | } | ||
| 8422 | @@ -535,10 +537,8 @@ bool BuiltinNameEmitter::CanReuseSignature( | ||
| 8423 | if (Rec->getValueAsBit("IsPure") == Rec2->getValueAsBit("IsPure") && | ||
| 8424 | Rec->getValueAsBit("IsConst") == Rec2->getValueAsBit("IsConst") && | ||
| 8425 | Rec->getValueAsBit("IsConv") == Rec2->getValueAsBit("IsConv") && | ||
| 8426 | - Rec->getValueAsDef("MinVersion")->getValueAsInt("ID") == | ||
| 8427 | - Rec2->getValueAsDef("MinVersion")->getValueAsInt("ID") && | ||
| 8428 | - Rec->getValueAsDef("MaxVersion")->getValueAsInt("ID") == | ||
| 8429 | - Rec2->getValueAsDef("MaxVersion")->getValueAsInt("ID") && | ||
| 8430 | + EncodeBuiltinVersions(Rec->getValueAsListOfDefs("Versions")) == | ||
| 8431 | + EncodeBuiltinVersions(Rec2->getValueAsListOfDefs("Versions")) && | ||
| 8432 | Rec->getValueAsDef("Extension")->getName() == | ||
| 8433 | Rec2->getValueAsDef("Extension")->getName()) { | ||
| 8434 | return true; | ||
| 8435 | @@ -814,6 +814,15 @@ static void OCL2Qual(ASTContext &Context, const OpenCLTypeStruct &Ty, | ||
| 8436 | OS << "\n} // OCL2Qual\n"; | ||
| 8437 | } | ||
| 8438 | |||
| 8439 | +unsigned short BuiltinNameEmitter::EncodeBuiltinVersions( | ||
| 8440 | + std::vector<Record *> BuiltinVersionsRecords) const { | ||
| 8441 | + return std::accumulate( | ||
| 8442 | + BuiltinVersionsRecords.begin(), BuiltinVersionsRecords.end(), | ||
| 8443 | + (unsigned short)0, [](unsigned short C, Record *R) { | ||
| 8444 | + return C |= clang::OpenCLOptions::EncodeVersion(R->getValueAsInt("ID")); | ||
| 8445 | + }); | ||
| 8446 | +} | ||
| 8447 | + | ||
| 8448 | void clang::EmitClangOpenCLBuiltins(RecordKeeper &Records, raw_ostream &OS) { | ||
| 8449 | BuiltinNameEmitter NameChecker(Records, OS); | ||
| 8450 | NameChecker.Emit(); | ||
| 8451 | -- | ||
| 8452 | 2.17.1 | ||
| 8453 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-Remove-repo-name-in-LLVM-IR.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-Remove-repo-name-in-LLVM-IR.patch deleted file mode 100644 index 09089432..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-Remove-repo-name-in-LLVM-IR.patch +++ /dev/null | |||
| @@ -1,50 +0,0 @@ | |||
| 1 | From ff0a6da84b94c16c4519c649f1f7bed3cdf89bbb Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Feng Zou <feng.zou@intel.com> | ||
| 3 | Date: Tue, 20 Oct 2020 11:29:04 +0800 | ||
| 4 | Subject: [PATCH] Remove repo name in LLVM IR | ||
| 5 | |||
| 6 | Upstream-Status: Backport [Taken from opencl-clang patches, https://github.com/intel/opencl-clang/blob/ocl-open-110/patches/llvm/0002-Remove-repo-name-in-LLVM-IR.patch] | ||
| 7 | Signed-off-by: Feng Zou <feng.zou@intel.com> | ||
| 8 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 9 | |||
| 10 | --- | ||
| 11 | llvm/cmake/modules/VersionFromVCS.cmake | 23 ++++++++++++----------- | ||
| 12 | 1 file changed, 12 insertions(+), 11 deletions(-) | ||
| 13 | |||
| 14 | diff --git a/llvm/cmake/modules/VersionFromVCS.cmake b/llvm/cmake/modules/VersionFromVCS.cmake | ||
| 15 | index 18edbeabe3e..2d965263478 100644 | ||
| 16 | --- a/llvm/cmake/modules/VersionFromVCS.cmake | ||
| 17 | +++ b/llvm/cmake/modules/VersionFromVCS.cmake | ||
| 18 | @@ -33,17 +33,18 @@ function(get_source_info path revision repository) | ||
| 19 | else() | ||
| 20 | set(remote "origin") | ||
| 21 | endif() | ||
| 22 | - execute_process(COMMAND ${GIT_EXECUTABLE} remote get-url ${remote} | ||
| 23 | - WORKING_DIRECTORY ${path} | ||
| 24 | - RESULT_VARIABLE git_result | ||
| 25 | - OUTPUT_VARIABLE git_output | ||
| 26 | - ERROR_QUIET) | ||
| 27 | - if(git_result EQUAL 0) | ||
| 28 | - string(STRIP "${git_output}" git_output) | ||
| 29 | - set(${repository} ${git_output} PARENT_SCOPE) | ||
| 30 | - else() | ||
| 31 | - set(${repository} ${path} PARENT_SCOPE) | ||
| 32 | - endif() | ||
| 33 | + # Do not show repo name in IR | ||
| 34 | + # execute_process(COMMAND ${GIT_EXECUTABLE} remote get-url ${remote} | ||
| 35 | + # WORKING_DIRECTORY ${path} | ||
| 36 | + # RESULT_VARIABLE git_result | ||
| 37 | + # OUTPUT_VARIABLE git_output | ||
| 38 | + # ERROR_QUIET) | ||
| 39 | + # if(git_result EQUAL 0) | ||
| 40 | + # string(STRIP "${git_output}" git_output) | ||
| 41 | + # set(${repository} ${git_output} PARENT_SCOPE) | ||
| 42 | + # else() | ||
| 43 | + # set(${repository} ${path} PARENT_SCOPE) | ||
| 44 | + # endif() | ||
| 45 | endif() | ||
| 46 | else() | ||
| 47 | message(WARNING "Git not found. Version cannot be determined.") | ||
| 48 | -- | ||
| 49 | 2.18.1 | ||
| 50 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-skip-building-tests.patch b/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-skip-building-tests.patch deleted file mode 100644 index 011c09ee..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/files/llvm11-skip-building-tests.patch +++ /dev/null | |||
| @@ -1,51 +0,0 @@ | |||
| 1 | From d362652617c5e840089273df0c6623a9745c92a2 Mon Sep 17 00:00:00 2001 | ||
| 2 | From: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 3 | Date: Wed, 21 Aug 2019 14:35:31 +0800 | ||
| 4 | Subject: [PATCH] llvm-spirv: skip building tests | ||
| 5 | |||
| 6 | Some of these need clang to be built and since we're building this in-tree, | ||
| 7 | that leads to problems when compiling libcxx, compiler-rt which aren't built | ||
| 8 | in-tree. | ||
| 9 | |||
| 10 | Instead of using SPIRV_SKIP_CLANG_BUILD to skip clang build and adding this to | ||
| 11 | all components, disable the building of tests altogether. | ||
| 12 | |||
| 13 | Upstream-Status: Inappropriate | ||
| 14 | |||
| 15 | Signed-off-by: Anuj Mittal <anuj.mittal@intel.com> | ||
| 16 | Signed-off-by: Naveen Saini <naveen.kumar.saini@intel.com> | ||
| 17 | --- | ||
| 18 | CMakeLists.txt | 10 ---------- | ||
| 19 | 1 file changed, 10 deletions(-) | ||
| 20 | |||
| 21 | diff --git a/CMakeLists.txt b/CMakeLists.txt | ||
| 22 | index ecebb4cb..578ca602 100644 | ||
| 23 | --- a/CMakeLists.txt | ||
| 24 | +++ b/CMakeLists.txt | ||
| 25 | @@ -25,13 +25,6 @@ if(LLVM_SPIRV_BUILD_EXTERNAL) | ||
| 26 | set(CMAKE_CXX_STANDARD 14) | ||
| 27 | set(CMAKE_CXX_STANDARD_REQUIRED ON) | ||
| 28 | |||
| 29 | - if(LLVM_SPIRV_INCLUDE_TESTS) | ||
| 30 | - set(LLVM_TEST_COMPONENTS | ||
| 31 | - llvm-as | ||
| 32 | - llvm-dis | ||
| 33 | - ) | ||
| 34 | - endif(LLVM_SPIRV_INCLUDE_TESTS) | ||
| 35 | - | ||
| 36 | find_package(LLVM ${BASE_LLVM_VERSION} REQUIRED | ||
| 37 | COMPONENTS | ||
| 38 | Analysis | ||
| 39 | @@ -62,9 +55,6 @@ set(LLVM_SPIRV_INCLUDE_DIRS ${CMAKE_CURRENT_SOURCE_DIR}/include) | ||
| 40 | |||
| 41 | add_subdirectory(lib/SPIRV) | ||
| 42 | add_subdirectory(tools/llvm-spirv) | ||
| 43 | -if(LLVM_SPIRV_INCLUDE_TESTS) | ||
| 44 | - add_subdirectory(test) | ||
| 45 | -endif(LLVM_SPIRV_INCLUDE_TESTS) | ||
| 46 | |||
| 47 | install( | ||
| 48 | FILES | ||
| 49 | -- | ||
| 50 | 2.26.2 | ||
| 51 | |||
| diff --git a/dynamic-layers/clang-layer/recipes-devtools/clang/llvm-project-source.bbappend b/dynamic-layers/clang-layer/recipes-devtools/clang/llvm-project-source.bbappend deleted file mode 100644 index 4e2bc535..00000000 --- a/dynamic-layers/clang-layer/recipes-devtools/clang/llvm-project-source.bbappend +++ /dev/null | |||
| @@ -1,35 +0,0 @@ | |||
| 1 | FILESEXTRAPATHS_prepend_intel-x86-common := "${THISDIR}/files:" | ||
| 2 | |||
| 3 | SPIRV_BRANCH = "${@bb.utils.contains('LLVMVERSION', '10.0.1', 'llvm_release_100', 'llvm_release_110', d)}" | ||
| 4 | |||
| 5 | SPIRV10_SRCREV = "576abae62cecd171992017a4a786e3831221ab8d" | ||
| 6 | SPIRV11_SRCREV = "2a8c1e6c9778deaa720a23e08c293006dc5d56fd" | ||
| 7 | |||
| 8 | SPIRV_SRCREV = "${@bb.utils.contains('LLVMVERSION', '10.0.1', '${SPIRV10_SRCREV}', '${SPIRV11_SRCREV}', d)}" | ||
| 9 | |||
| 10 | SRC_URI_LLVM10 = " \ | ||
| 11 | file://llvm10-skip-building-tests.patch;patchdir=llvm/projects/llvm-spirv \ | ||
| 12 | file://fix-shared-libs.patch;patchdir=llvm/projects/llvm-spirv \ | ||
| 13 | file://BasicBlockUtils-Add-metadata-fixing-in-SplitBlockPre.patch;patchdir=llvm \ | ||
| 14 | file://IndVarSimplify-Do-not-use-SCEV-expander-for-IVCount-.patch;patchdir=llvm \ | ||
| 15 | file://llvm10-OpenCL-3.0-support.patch \ | ||
| 16 | file://0002-Add-cl_khr_extended_subgroup-extensions.patch \ | ||
| 17 | file://0001-Memory-leak-fix-for-Managed-Static-Mutex.patch \ | ||
| 18 | file://llvm10-Remove-repo-name-in-LLVM-IR.patch \ | ||
| 19 | file://0001-Fix-debug-info-of-work-item-builtin-translation-745.patch;patchdir=llvm/projects/llvm-spirv \ | ||
| 20 | " | ||
| 21 | |||
| 22 | SRC_URI_LLVM11 = " \ | ||
| 23 | file://llvm11-skip-building-tests.patch;patchdir=llvm/projects/llvm-spirv \ | ||
| 24 | file://llvm11-OpenCL-3.0-support.patch \ | ||
| 25 | file://0001-Memory-leak-fix-for-Managed-Static-Mutex.patch \ | ||
| 26 | file://llvm11-Remove-repo-name-in-LLVM-IR.patch \ | ||
| 27 | " | ||
| 28 | |||
| 29 | SPIRV_LLVM_SRC_URI = "git://github.com/KhronosGroup/SPIRV-LLVM-Translator.git;protocol=https;branch=${SPIRV_BRANCH};destsuffix=git/llvm/projects/llvm-spirv;name=spirv" | ||
| 30 | |||
| 31 | SPIRV_LLVM_PATCHES = "${@bb.utils.contains('LLVMVERSION', '10.0.1', '${SRC_URI_LLVM10}', '${SRC_URI_LLVM11}', d)}" | ||
| 32 | |||
| 33 | |||
| 34 | SRC_URI_append_intel-x86-common = "${@bb.utils.contains('LLVMVERSION', '12.0.0', '', ' ${SPIRV_LLVM_SRC_URI} ${SPIRV_LLVM_PATCHES} ', d)}" | ||
| 35 | SRCREV_spirv = "${@bb.utils.contains('LLVMVERSION', '12.0.0', '', '${SPIRV_SRCREV}', d)}" | ||
