summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--libclc/amdgcn-amdhsa/lib/OVERRIDES3
-rw-r--r--libclc/amdgcn/lib/OVERRIDES_3.93
-rw-r--r--libclc/amdgcn/lib/SOURCES_3.93
-rw-r--r--libclc/amdgcn/lib/workitem/get_global_size.39.ll18
-rw-r--r--libclc/amdgcn/lib/workitem/get_local_size.39.ll18
-rw-r--r--libclc/amdgcn/lib/workitem/get_num_groups.39.ll18
-rw-r--r--libclc/amdgpu/lib/SOURCES_3.92
-rwxr-xr-xlibclc/configure.py20
-rw-r--r--libclc/utils/prepare-builtins.cpp9
9 files changed, 90 insertions, 4 deletions
diff --git a/libclc/amdgcn-amdhsa/lib/OVERRIDES b/libclc/amdgcn-amdhsa/lib/OVERRIDES
index c9bd69b76eb..e4dfca11c8a 100644
--- a/libclc/amdgcn-amdhsa/lib/OVERRIDES
+++ b/libclc/amdgcn-amdhsa/lib/OVERRIDES
@@ -1 +1,4 @@
workitem/get_num_groups.ll
+workitem/get_global_size.39.ll
+workitem/get_local_size.39.ll
+workitem/get_num_groups.39.ll
diff --git a/libclc/amdgcn/lib/OVERRIDES_3.9 b/libclc/amdgcn/lib/OVERRIDES_3.9
new file mode 100644
index 00000000000..f26fbbe9934
--- /dev/null
+++ b/libclc/amdgcn/lib/OVERRIDES_3.9
@@ -0,0 +1,3 @@
+workitem/get_global_size.ll
+workitem/get_local_size.ll
+workitem/get_num_groups.ll
diff --git a/libclc/amdgcn/lib/SOURCES_3.9 b/libclc/amdgcn/lib/SOURCES_3.9
new file mode 100644
index 00000000000..6ee7cb8184f
--- /dev/null
+++ b/libclc/amdgcn/lib/SOURCES_3.9
@@ -0,0 +1,3 @@
+workitem/get_global_size.39.ll
+workitem/get_local_size.39.ll
+workitem/get_num_groups.39.ll
diff --git a/libclc/amdgcn/lib/workitem/get_global_size.39.ll b/libclc/amdgcn/lib/workitem/get_global_size.39.ll
new file mode 100644
index 00000000000..d51def36bf8
--- /dev/null
+++ b/libclc/amdgcn/lib/workitem/get_global_size.39.ll
@@ -0,0 +1,18 @@
+declare i32 @llvm.r600.read.global.size.x() nounwind readnone
+declare i32 @llvm.r600.read.global.size.y() nounwind readnone
+declare i32 @llvm.r600.read.global.size.z() nounwind readnone
+
+define i32 @get_global_size(i32 %dim) nounwind readnone alwaysinline {
+ switch i32 %dim, label %default [i32 0, label %x_dim i32 1, label %y_dim i32 2, label %z_dim]
+x_dim:
+ %x = call i32 @llvm.r600.read.global.size.x()
+ ret i32 %x
+y_dim:
+ %y = call i32 @llvm.r600.read.global.size.y()
+ ret i32 %y
+z_dim:
+ %z = call i32 @llvm.r600.read.global.size.z()
+ ret i32 %z
+default:
+ ret i32 1
+}
diff --git a/libclc/amdgcn/lib/workitem/get_local_size.39.ll b/libclc/amdgcn/lib/workitem/get_local_size.39.ll
new file mode 100644
index 00000000000..92c6d268e82
--- /dev/null
+++ b/libclc/amdgcn/lib/workitem/get_local_size.39.ll
@@ -0,0 +1,18 @@
+declare i32 @llvm.r600.read.local.size.x() nounwind readnone
+declare i32 @llvm.r600.read.local.size.y() nounwind readnone
+declare i32 @llvm.r600.read.local.size.z() nounwind readnone
+
+define i32 @get_local_size(i32 %dim) nounwind readnone alwaysinline {
+ switch i32 %dim, label %default [i32 0, label %x_dim i32 1, label %y_dim i32 2, label %z_dim]
+x_dim:
+ %x = call i32 @llvm.r600.read.local.size.x()
+ ret i32 %x
+y_dim:
+ %y = call i32 @llvm.r600.read.local.size.y()
+ ret i32 %y
+z_dim:
+ %z = call i32 @llvm.r600.read.local.size.z()
+ ret i32 %z
+default:
+ ret i32 1
+}
diff --git a/libclc/amdgcn/lib/workitem/get_num_groups.39.ll b/libclc/amdgcn/lib/workitem/get_num_groups.39.ll
new file mode 100644
index 00000000000..fd5c17cccb8
--- /dev/null
+++ b/libclc/amdgcn/lib/workitem/get_num_groups.39.ll
@@ -0,0 +1,18 @@
+declare i32 @llvm.r600.read.ngroups.x() nounwind readnone
+declare i32 @llvm.r600.read.ngroups.y() nounwind readnone
+declare i32 @llvm.r600.read.ngroups.z() nounwind readnone
+
+define i32 @get_num_groups(i32 %dim) nounwind readnone alwaysinline {
+ switch i32 %dim, label %default [i32 0, label %x_dim i32 1, label %y_dim i32 2, label %z_dim]
+x_dim:
+ %x = call i32 @llvm.r600.read.ngroups.x()
+ ret i32 %x
+y_dim:
+ %y = call i32 @llvm.r600.read.ngroups.y()
+ ret i32 %y
+z_dim:
+ %z = call i32 @llvm.r600.read.ngroups.z()
+ ret i32 %z
+default:
+ ret i32 1
+}
diff --git a/libclc/amdgpu/lib/SOURCES_3.9 b/libclc/amdgpu/lib/SOURCES_3.9
new file mode 100644
index 00000000000..69c5e5ce9fb
--- /dev/null
+++ b/libclc/amdgpu/lib/SOURCES_3.9
@@ -0,0 +1,2 @@
+shared/vload_half_helpers.ll
+shared/vstore_half_helpers.ll
diff --git a/libclc/configure.py b/libclc/configure.py
index 4e7a32c5608..00d1ecbc223 100755
--- a/libclc/configure.py
+++ b/libclc/configure.py
@@ -72,8 +72,8 @@ llvm_version = llvm_config(['--version']).replace('svn', '').split('.')
llvm_int_version = int(llvm_version[0]) * 100 + int(llvm_version[1]) * 10
llvm_string_version = llvm_version[0] + '.' + llvm_version[1]
-if llvm_int_version < 400:
- print("libclc requires LLVM >= 4.0")
+if llvm_int_version < 390:
+ print("libclc requires LLVM >= 3.9")
sys.exit(1)
llvm_system_libs = llvm_config(['--system-libs'])
@@ -109,9 +109,13 @@ available_targets = {
'nvptx64--nvidiacl' : { 'devices' : [{'gpu' : '', 'aliases' : []} ]},
}
-available_targets['amdgcn-mesa-mesa3d'] = available_targets['amdgcn--']
-default_targets = ['nvptx--nvidiacl', 'nvptx64--nvidiacl', 'r600--', 'amdgcn--', 'amdgcn--amdhsa', 'amdgcn-mesa-mesa3d']
+default_targets = ['nvptx--nvidiacl', 'nvptx64--nvidiacl', 'r600--', 'amdgcn--', 'amdgcn--amdhsa']
+
+#mesa is using amdgcn-mesa-mesa3d since llvm-4.0
+if llvm_int_version > 390:
+ available_targets['amdgcn-mesa-mesa3d'] = available_targets['amdgcn--']
+ default_targets.append('amdgcn-mesa-mesa3d')
targets = args
if not targets:
@@ -218,6 +222,8 @@ for target in targets:
override_list_file = os.path.join(libdir, 'OVERRIDES')
compat_list_file = os.path.join(libdir,
'SOURCES_' + llvm_string_version)
+ compat_list_override = os.path.join(libdir,
+ 'OVERRIDES_' + llvm_string_version)
# Build compat list
if os.path.exists(compat_list_file):
@@ -225,6 +231,12 @@ for target in targets:
compat = compat.rstrip()
compats.append(compat)
+ # Add target compat overrides
+ if os.path.exists(compat_list_override):
+ for override in open(compat_list_override).readlines():
+ override = override.rstrip()
+ sources_seen.add(override)
+
# Add target overrides
if os.path.exists(override_list_file):
for override in open(override_list_file).readlines():
diff --git a/libclc/utils/prepare-builtins.cpp b/libclc/utils/prepare-builtins.cpp
index 5cd32cdb248..0f03e050a3d 100644
--- a/libclc/utils/prepare-builtins.cpp
+++ b/libclc/utils/prepare-builtins.cpp
@@ -1,5 +1,10 @@
+#if HAVE_LLVM > 0x0390
#include "llvm/Bitcode/BitcodeReader.h"
#include "llvm/Bitcode/BitcodeWriter.h"
+#else
+#include "llvm/Bitcode/ReaderWriter.h"
+#endif
+
#include "llvm/IR/Function.h"
#include "llvm/IR/GlobalVariable.h"
#include "llvm/IR/LLVMContext.h"
@@ -41,8 +46,12 @@ int main(int argc, char **argv) {
} else {
std::unique_ptr<MemoryBuffer> &BufferPtr = BufferOrErr.get();
ErrorOr<std::unique_ptr<Module>> ModuleOrErr =
+#if HAVE_LLVM > 0x0390
expectedToErrorOrAndEmitErrors(Context,
parseBitcodeFile(BufferPtr.get()->getMemBufferRef(), Context));
+#else
+ parseBitcodeFile(BufferPtr.get()->getMemBufferRef(), Context);
+#endif
if (std::error_code ec = ModuleOrErr.getError())
ErrorMessage = ec.message();
OpenPOWER on IntegriCloud