From dbde936c3c0a11ecd986df6587719739bf2a1175 Mon Sep 17 00:00:00 2001 From: Evghenii Date: Tue, 12 Nov 2013 16:47:47 +0100 Subject: [PATCH] bugfix in inlined ptx, now NVCC also compiles the ptx --- builtins/target-nvptx64.ll | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/builtins/target-nvptx64.ll b/builtins/target-nvptx64.ll index 7b469307..e60c8f05 100644 --- a/builtins/target-nvptx64.ll +++ b/builtins/target-nvptx64.ll @@ -110,11 +110,11 @@ module asm " .param .b64 cudaLaunchDevice_param_5 ); " -define i8* @ISPCAlloc(i8**, i64, i32) nounwind alwaysinline builtin +define i8* @ISPCAlloc(i8**, i64, i32) nounwind alwaysinline { ret i8* null } -define void @ISPCLaunch(i8**, i8* %func_ptr, i8** %func_args, i32 %ntx, i32 %nty, i32 %ntz) builtin +define void @ISPCLaunch(i8**, i8* %func_ptr, i8** %func_args, i32 %ntx, i32 %nty, i32 %ntz) nounwind alwaysinline { %func_i64 = ptrtoint i8* %func_ptr to i64 %args_i64 = ptrtoint i8** %func_args to i64 @@ -155,6 +155,7 @@ define void @ISPCLaunch(i8**, i8* %func_ptr, i8** %func_args, i32 %ntx, i32 %nty param5 ); ld.param.b32 $0, [retval0+0]; + } ", "=r, l,l, r,r,r, r,r,r, r,l"(i64 %func_i64,i64 %args_i64, i32 %nbx,i32 %nty,i32 %ntz, i32 128,i32 1,i32 1, i32 0,i64 0); ret void