amdgpu,nvptx: unify kernel calling conventions

AmdgpuKernel and NvptxKernel are unified into a Kernel calling convention. There is really no reason for these to be separate; no backend is allowed to emit the calling convention of the other. This is in the same spirit as the .Interrupt calling convention lowering to different LLVM calling conventions, and opens the way for SPIR-V kernels to be exported using the Kernel calling convention.
2023-04-08 14:17:34 +02:00
parent 3f2025f59e
commit f12beb857a
6 changed files with 27 additions and 30 deletions
--- a/test/nvptx.zig
+++ b/test/nvptx.zig
@@ -10,7 +10,7 @@ pub fn addCases(ctx: *Cases) !void {
            \\    return a + b;
            \\}
            \\
-            \\pub export fn add_and_substract(a: i32, out: *i32) callconv(.PtxKernel) void {
+            \\pub export fn add_and_substract(a: i32, out: *i32) callconv(.Kernel) void {
            \\    const x = add(a, 7);
            \\    var y = add(2, 0);
            \\    y -= x;
@@ -29,7 +29,7 @@ pub fn addCases(ctx: *Cases) !void {
            \\    );
            \\}
            \\
-            \\pub export fn special_reg(a: []const i32, out: []i32) callconv(.PtxKernel) void {
+            \\pub export fn special_reg(a: []const i32, out: []i32) callconv(.Kernel) void {
            \\    const i = threadIdX();
            \\    out[i] = a[i] + 7;
            \\}
@@ -42,7 +42,7 @@ pub fn addCases(ctx: *Cases) !void {
        case.addCompile(
            \\var x: i32 addrspace(.global) = 0;
            \\
-            \\pub export fn increment(out: *i32) callconv(.PtxKernel) void {
+            \\pub export fn increment(out: *i32) callconv(.Kernel) void {
            \\    x += 1;
            \\    out.* = x;
            \\}
@@ -59,7 +59,7 @@ pub fn addCases(ctx: *Cases) !void {
            \\}
            \\
            \\ var _sdata: [1024]f32 addrspace(.shared) = undefined;
-            \\ pub export fn reduceSum(d_x: []const f32, out: *f32) callconv(.PtxKernel) void {
+            \\ pub export fn reduceSum(d_x: []const f32, out: *f32) callconv(.Kernel) void {
            \\     var sdata = @addrSpaceCast(.generic, &_sdata);
            \\     const tid: u32 = threadIdX();
            \\     var sum = d_x[tid];