diff options
| author | Justin Holewinski <jholewinski@nvidia.com> | 2012-05-04 20:18:50 +0000 |
|---|---|---|
| committer | Justin Holewinski <jholewinski@nvidia.com> | 2012-05-04 20:18:50 +0000 |
| commit | ae556d3ef72dfe5f40a337b7071f42b7bf5b66a4 (patch) | |
| tree | 14ad103ff9863d609096fcf56552790c407f13d5 /llvm/test/CodeGen/NVPTX/convert-int-sm20.ll | |
| parent | 2420e8b7d591acce85b253f4b234c1a8c05fa5e6 (diff) | |
| download | bcm5719-llvm-ae556d3ef72dfe5f40a337b7071f42b7bf5b66a4.tar.gz bcm5719-llvm-ae556d3ef72dfe5f40a337b7071f42b7bf5b66a4.zip | |
This patch adds a new NVPTX back-end to LLVM which supports code generation for NVIDIA PTX 3.0. This back-end will (eventually) replace the current PTX back-end, while maintaining compatibility with it.
The new target machines are:
nvptx (old ptx32) => 32-bit PTX
nvptx64 (old ptx64) => 64-bit PTX
The sources are based on the internal NVIDIA NVPTX back-end, and
contain more functionality than the current PTX back-end currently
provides.
NV_CONTRIB
llvm-svn: 156196
Diffstat (limited to 'llvm/test/CodeGen/NVPTX/convert-int-sm20.ll')
| -rw-r--r-- | llvm/test/CodeGen/NVPTX/convert-int-sm20.ll | 64 |
1 files changed, 64 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/convert-int-sm20.ll b/llvm/test/CodeGen/NVPTX/convert-int-sm20.ll new file mode 100644 index 00000000000..fad240e03d2 --- /dev/null +++ b/llvm/test/CodeGen/NVPTX/convert-int-sm20.ll @@ -0,0 +1,64 @@ +; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s +; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 | FileCheck %s + + +;; Integer conversions happen inplicitly by loading/storing the proper types + + +; i16 + +define i16 @cvt_i16_i32(i32 %x) { +; CHECK: ld.param.u16 %rs[[R0:[0-9]+]], [cvt_i16_i32_param_{{[0-9]+}}] +; CHECK: st.param.b16 [func_retval{{[0-9]+}}+0], %rs[[R0]] +; CHECK: ret + %a = trunc i32 %x to i16 + ret i16 %a +} + +define i16 @cvt_i16_i64(i64 %x) { +; CHECK: ld.param.u16 %rs[[R0:[0-9]+]], [cvt_i16_i64_param_{{[0-9]+}}] +; CHECK: st.param.b16 [func_retval{{[0-9]+}}+0], %rs[[R0]] +; CHECK: ret + %a = trunc i64 %x to i16 + ret i16 %a +} + + + +; i32 + +define i32 @cvt_i32_i16(i16 %x) { +; CHECK: ld.param.u16 %r[[R0:[0-9]+]], [cvt_i32_i16_param_{{[0-9]+}}] +; CHECK: st.param.b32 [func_retval{{[0-9]+}}+0], %r[[R0]] +; CHECK: ret + %a = zext i16 %x to i32 + ret i32 %a +} + +define i32 @cvt_i32_i64(i64 %x) { +; CHECK: ld.param.u32 %r[[R0:[0-9]+]], [cvt_i32_i64_param_{{[0-9]+}}] +; CHECK: st.param.b32 [func_retval{{[0-9]+}}+0], %r[[R0]] +; CHECK: ret + %a = trunc i64 %x to i32 + ret i32 %a +} + + + +; i64 + +define i64 @cvt_i64_i16(i16 %x) { +; CHECK: ld.param.u16 %rl[[R0:[0-9]+]], [cvt_i64_i16_param_{{[0-9]+}}] +; CHECK: st.param.b64 [func_retval{{[0-9]+}}+0], %rl[[R0]] +; CHECK: ret + %a = zext i16 %x to i64 + ret i64 %a +} + +define i64 @cvt_i64_i32(i32 %x) { +; CHECK: ld.param.u32 %rl[[R0:[0-9]+]], [cvt_i64_i32_param_{{[0-9]+}}] +; CHECK: st.param.b64 [func_retval{{[0-9]+}}+0], %rl[[R0]] +; CHECK: ret + %a = zext i32 %x to i64 + ret i64 %a +} |

