Commit 031c768cc8
Changed files (7)
src/arch/aarch64/abi.zig
@@ -5,7 +5,14 @@ const Register = bits.Register;
const RegisterManagerFn = @import("../../register_manager.zig").RegisterManager;
const Type = @import("../../type.zig").Type;
-pub const Class = union(enum) { memory, integer, double_integer, none, float_array: u8 };
+pub const Class = union(enum) {
+ memory,
+ byval,
+ integer,
+ double_integer,
+ none,
+ float_array: u8,
+};
/// For `float_array`, the payload is the number of floats.
pub fn classifyType(ty: Type, target: std.Target) Class {
@@ -13,7 +20,7 @@ pub fn classifyType(ty: Type, target: std.Target) Class {
var maybe_float_bits: ?u16 = null;
switch (ty.zigTypeTag()) {
.Struct => {
- if (ty.containerLayout() == .Packed) return .integer;
+ if (ty.containerLayout() == .Packed) return .byval;
const float_count = countFloats(ty, target, &maybe_float_bits);
if (float_count <= sret_float_count) return .{ .float_array = float_count };
@@ -23,7 +30,7 @@ pub fn classifyType(ty: Type, target: std.Target) Class {
return .integer;
},
.Union => {
- if (ty.containerLayout() == .Packed) return .integer;
+ if (ty.containerLayout() == .Packed) return .byval;
const float_count = countFloats(ty, target, &maybe_float_bits);
if (float_count <= sret_float_count) return .{ .float_array = float_count };
@@ -32,14 +39,20 @@ pub fn classifyType(ty: Type, target: std.Target) Class {
if (bit_size > 64) return .double_integer;
return .integer;
},
- .Int, .Enum, .ErrorSet, .Vector, .Float, .Bool => return .integer,
+ .Int, .Enum, .ErrorSet, .Float, .Bool => return .byval,
+ .Vector => {
+ const bit_size = ty.bitSize(target);
+ // TODO: is this 128-bit limit controlled by a CPU feature?
+ if (bit_size > 128) return .memory;
+ return .byval;
+ },
.Optional => {
std.debug.assert(ty.isPtrLikeOptional());
- return .integer;
+ return .byval;
},
.Pointer => {
std.debug.assert(!ty.isSlice());
- return .integer;
+ return .byval;
},
.ErrorUnion,
.Frame,
src/arch/arm/abi.zig
@@ -21,7 +21,9 @@ pub const Class = union(enum) {
}
};
-pub fn classifyType(ty: Type, target: std.Target) Class {
+pub const Context = enum { ret, arg };
+
+pub fn classifyType(ty: Type, target: std.Target, ctx: Context) Class {
if (!ty.hasRuntimeBitsIgnoreComptime()) return .none;
var maybe_float_bits: ?u16 = null;
@@ -66,14 +68,17 @@ pub fn classifyType(ty: Type, target: std.Target) Class {
}
return Class.arrSize(bit_size, 32);
},
- .Int, .Enum => {
+ .Bool, .Float => return .byval,
+ .Int, .Enum, .ErrorSet => {
const bit_size = ty.bitSize(target);
if (bit_size > 64) return .memory;
return .byval;
},
- .ErrorSet, .Vector, .Float, .Bool => {
+ .Vector => {
const bit_size = ty.bitSize(target);
- if (bit_size > 128) return .memory;
+ // TODO: are these vector size limits controlled by a CPU feature?
+ if (ctx == .ret and bit_size > 128) return .memory;
+ if (bit_size > 512) return .memory;
return .byval;
},
.Optional => {
src/arch/x86_64/abi.zig
@@ -60,9 +60,11 @@ pub fn classifyWindows(ty: Type, target: Target) Class {
}
}
+pub const Context = enum { ret, arg };
+
/// There are a maximum of 8 possible return slots. Returned values are in
/// the beginning of the array; unused slots are filled with .none.
-pub fn classifySystemV(ty: Type, target: Target) [8]Class {
+pub fn classifySystemV(ty: Type, target: Target, ctx: Context) [8]Class {
const memory_class = [_]Class{
.memory, .none, .none, .none,
.none, .none, .none, .none,
@@ -134,6 +136,22 @@ pub fn classifySystemV(ty: Type, target: Target) [8]Class {
},
.Vector => {
const elem_ty = ty.childType();
+ if (ctx == .arg) {
+ const bit_size = ty.bitSize(target);
+ if (bit_size > 128) return memory_class;
+ if (bit_size > 80) return .{
+ .integer, .integer, .none, .none,
+ .none, .none, .none, .none,
+ };
+ if (bit_size > 64) return .{
+ .x87, .none, .none, .none,
+ .none, .none, .none, .none,
+ };
+ return .{
+ .integer, .none, .none, .none,
+ .none, .none, .none, .none,
+ };
+ }
const bits = elem_ty.bitSize(target) * ty.arrayLen();
if (bits <= 64) return .{
.sse, .none, .none, .none,
@@ -201,7 +219,7 @@ pub fn classifySystemV(ty: Type, target: Target) [8]Class {
}
}
const field_size = field.ty.abiSize(target);
- const field_class_array = classifySystemV(field.ty, target);
+ const field_class_array = classifySystemV(field.ty, target, .arg);
const field_class = std.mem.sliceTo(&field_class_array, .none);
if (byte_i + field_size <= 8) {
// Combine this field with the previous one.
@@ -315,7 +333,7 @@ pub fn classifySystemV(ty: Type, target: Target) [8]Class {
}
}
// Combine this field with the previous one.
- const field_class = classifySystemV(field.ty, target);
+ const field_class = classifySystemV(field.ty, target, .arg);
for (result) |*result_item, i| {
const field_item = field_class[i];
// "If both classes are equal, this is the resulting class."
src/arch/x86_64/CodeGen.zig
@@ -7143,7 +7143,7 @@ fn resolveCallingConventionValues(self: *Self, fn_ty: Type) !CallMCValues {
const classes: []const abi.Class = switch (self.target.os.tag) {
.windows => &[1]abi.Class{abi.classifyWindows(ty, self.target.*)},
- else => mem.sliceTo(&abi.classifySystemV(ty, self.target.*), .none),
+ else => mem.sliceTo(&abi.classifySystemV(ty, self.target.*, .arg), .none),
};
if (classes.len > 1) {
return self.fail("TODO handle multiple classes per type", .{});
src/codegen/llvm.zig
@@ -10110,11 +10110,11 @@ fn firstParamSRet(fn_info: Type.Payload.Function.Data, target: std.Target) bool
.mips, .mipsel => return false,
.x86_64 => switch (target.os.tag) {
.windows => return x86_64_abi.classifyWindows(fn_info.return_type, target) == .memory,
- else => return x86_64_abi.classifySystemV(fn_info.return_type, target)[0] == .memory,
+ else => return x86_64_abi.classifySystemV(fn_info.return_type, target, .ret)[0] == .memory,
},
.wasm32 => return wasm_c_abi.classifyType(fn_info.return_type, target)[0] == .indirect,
.aarch64, .aarch64_be => return aarch64_c_abi.classifyType(fn_info.return_type, target) == .memory,
- .arm, .armeb => switch (arm_c_abi.classifyType(fn_info.return_type, target)) {
+ .arm, .armeb => switch (arm_c_abi.classifyType(fn_info.return_type, target, .ret)) {
.memory, .i64_array => return true,
.i32_array => |size| return size != 1,
.none, .byval => return false,
@@ -10171,7 +10171,7 @@ fn lowerFnRetTy(dg: *DeclGen, fn_info: Type.Payload.Function.Data) !*llvm.Type {
if (is_scalar) {
return dg.lowerType(fn_info.return_type);
}
- const classes = x86_64_abi.classifySystemV(fn_info.return_type, target);
+ const classes = x86_64_abi.classifySystemV(fn_info.return_type, target, .ret);
if (classes[0] == .memory) {
return dg.context.voidType();
}
@@ -10229,12 +10229,10 @@ fn lowerFnRetTy(dg: *DeclGen, fn_info: Type.Payload.Function.Data) !*llvm.Type {
return dg.context.intType(@intCast(c_uint, abi_size * 8));
},
.aarch64, .aarch64_be => {
- if (is_scalar) {
- return dg.lowerType(fn_info.return_type);
- }
switch (aarch64_c_abi.classifyType(fn_info.return_type, target)) {
.memory, .none => return dg.context.voidType(),
.float_array => return dg.lowerType(fn_info.return_type),
+ .byval => return dg.lowerType(fn_info.return_type),
.integer => {
const bit_size = fn_info.return_type.bitSize(target);
return dg.context.intType(@intCast(c_uint, bit_size));
@@ -10243,7 +10241,7 @@ fn lowerFnRetTy(dg: *DeclGen, fn_info: Type.Payload.Function.Data) !*llvm.Type {
}
},
.arm, .armeb => {
- switch (arm_c_abi.classifyType(fn_info.return_type, target)) {
+ switch (arm_c_abi.classifyType(fn_info.return_type, target, .ret)) {
.memory, .i64_array => return dg.context.voidType(),
.i32_array => |len| if (len == 1) {
return dg.context.intType(32);
@@ -10376,18 +10374,18 @@ const ParamTypeIterator = struct {
else => unreachable,
},
else => {
- if (is_scalar) {
- it.zig_index += 1;
- it.llvm_index += 1;
- return .byval;
- }
- const classes = x86_64_abi.classifySystemV(ty, it.target);
+ const classes = x86_64_abi.classifySystemV(ty, it.target, .arg);
if (classes[0] == .memory) {
it.zig_index += 1;
it.llvm_index += 1;
it.byval_attr = true;
return .byref;
}
+ if (is_scalar) {
+ it.zig_index += 1;
+ it.llvm_index += 1;
+ return .byval;
+ }
var llvm_types_buffer: [8]u16 = undefined;
var llvm_types_index: u32 = 0;
for (classes) |class| {
@@ -10452,13 +10450,11 @@ const ParamTypeIterator = struct {
.aarch64, .aarch64_be => {
it.zig_index += 1;
it.llvm_index += 1;
- if (is_scalar) {
- return .byval;
- }
switch (aarch64_c_abi.classifyType(ty, it.target)) {
.none => unreachable,
.memory => return .byref,
.float_array => |len| return Lowering{ .float_array = len },
+ .byval => return .byval,
.integer => {
it.llvm_types_len = 1;
it.llvm_types_buffer[0] = 64;
@@ -10470,7 +10466,7 @@ const ParamTypeIterator = struct {
.arm, .armeb => {
it.zig_index += 1;
it.llvm_index += 1;
- switch (arm_c_abi.classifyType(ty, it.target)) {
+ switch (arm_c_abi.classifyType(ty, it.target, .arg)) {
.none => unreachable,
.memory => {
it.byval_attr = true;
test/c_abi/cfuncs.c
@@ -1,8 +1,8 @@
+#include <complex.h>
#include <inttypes.h>
-#include <stdlib.h>
#include <stdbool.h>
+#include <stdlib.h>
#include <string.h>
-#include <complex.h>
void zig_panic();
@@ -210,7 +210,7 @@ void run_c_tests(void) {
zig_longdouble(12.34l);
zig_five_floats(1.0f, 2.0f, 3.0f, 4.0f, 5.0f);
- zig_ptr((void*)0xdeadbeefL);
+ zig_ptr((void *)0xdeadbeefL);
zig_bool(true);
@@ -408,7 +408,7 @@ void c_long_double(long double x) {
}
void c_ptr(void *x) {
- assert_or_panic(x == (void*)0xdeadbeefL);
+ assert_or_panic(x == (void *)0xdeadbeefL);
}
void c_bool(bool x) {
@@ -676,7 +676,7 @@ void c_struct_with_array(StructWithArray x) {
}
StructWithArray c_ret_struct_with_array() {
- return (StructWithArray) { 4, {}, 155 };
+ return (StructWithArray){4, {}, 155};
}
typedef struct {
@@ -705,3 +705,31 @@ FloatArrayStruct c_ret_float_array_struct() {
x.size.height = 4;
return x;
}
+
+typedef uint32_t SmallVec __attribute__((vector_size(2 * sizeof(uint32_t))));
+
+void c_small_vec(SmallVec vec) {
+ assert_or_panic(vec[0] == 1);
+ assert_or_panic(vec[1] == 2);
+}
+
+SmallVec c_ret_small_vec(void) {
+ return (SmallVec){3, 4};
+}
+
+typedef size_t BigVec __attribute__((vector_size(8 * sizeof(size_t))));
+
+void c_big_vec(BigVec vec) {
+ assert_or_panic(vec[0] == 1);
+ assert_or_panic(vec[1] == 2);
+ assert_or_panic(vec[2] == 3);
+ assert_or_panic(vec[3] == 4);
+ assert_or_panic(vec[4] == 5);
+ assert_or_panic(vec[5] == 6);
+ assert_or_panic(vec[6] == 7);
+ assert_or_panic(vec[7] == 8);
+}
+
+BigVec c_ret_big_vec(void) {
+ return (BigVec){9, 10, 11, 12, 13, 14, 15, 16};
+}
test/c_abi/main.zig
@@ -766,3 +766,38 @@ test "Float array like struct" {
try std.testing.expect(x.size.width == 3);
try std.testing.expect(x.size.height == 4);
}
+
+const SmallVec = @Vector(2, u32);
+
+extern fn c_small_vec(SmallVec) void;
+extern fn c_ret_small_vec() SmallVec;
+
+test "small simd vector" {
+ if (builtin.cpu.arch == .i386) return error.SkipZigTest;
+ if (comptime builtin.cpu.arch.isRISCV()) return error.SkipZigTest;
+
+ c_small_vec(.{ 1, 2 });
+
+ var x = c_ret_small_vec();
+ try std.testing.expect(x[0] == 3);
+ try std.testing.expect(x[1] == 4);
+}
+
+const BigVec = @Vector(8, usize);
+
+extern fn c_big_vec(BigVec) void;
+extern fn c_ret_big_vec() BigVec;
+
+test "big simd vector" {
+ c_big_vec(.{ 1, 2, 3, 4, 5, 6, 7, 8 });
+
+ var x = c_ret_big_vec();
+ try std.testing.expect(x[0] == 9);
+ try std.testing.expect(x[1] == 10);
+ try std.testing.expect(x[2] == 11);
+ try std.testing.expect(x[3] == 12);
+ try std.testing.expect(x[4] == 13);
+ try std.testing.expect(x[5] == 14);
+ try std.testing.expect(x[6] == 15);
+ try std.testing.expect(x[7] == 16);
+}