zig/src-self-hosted/value.zig

581 lines
19 KiB
Zig
Raw Normal View History

const std = @import("std");
2020-04-18 16:41:45 -07:00
const Type = @import("type.zig").Type;
const log2 = std.math.log2;
const assert = std.debug.assert;
2020-04-21 14:54:00 -07:00
const BigInt = std.math.big.Int;
2020-04-21 16:48:59 -07:00
const Target = std.Target;
const Allocator = std.mem.Allocator;
2020-04-17 21:09:43 -07:00
/// This is the raw data, with no bookkeeping, no memory awareness,
/// no de-duplication, and no type system awareness.
/// It's important for this struct to be small.
2020-04-18 16:41:45 -07:00
/// This union takes advantage of the fact that the first page of memory
/// is unmapped, giving us 4096 possible enum tags that have no payload.
pub const Value = extern union {
/// If the tag value is less than Tag.no_payload_count, then no pointer
/// dereference is needed.
tag_if_small_enough: usize,
ptr_otherwise: *Payload,
2020-04-17 21:09:43 -07:00
pub const Tag = enum {
2020-04-18 16:41:45 -07:00
// The first section of this enum are tags that require no payload.
2020-04-21 14:06:09 -07:00
u8_type,
i8_type,
isize_type,
usize_type,
c_short_type,
c_ushort_type,
c_int_type,
c_uint_type,
c_long_type,
c_ulong_type,
c_longlong_type,
c_ulonglong_type,
c_longdouble_type,
f16_type,
f32_type,
f64_type,
f128_type,
c_void_type,
bool_type,
2020-04-17 21:09:43 -07:00
void_type,
2020-04-21 14:06:09 -07:00
type_type,
anyerror_type,
comptime_int_type,
comptime_float_type,
2020-04-17 21:09:43 -07:00
noreturn_type,
2020-04-21 14:06:09 -07:00
fn_naked_noreturn_no_args_type,
2020-04-21 18:14:56 -07:00
single_const_pointer_to_comptime_int_type,
2020-04-21 14:06:09 -07:00
const_slice_u8_type,
2020-04-21 21:04:52 -07:00
zero,
2020-04-17 21:09:43 -07:00
void_value,
noreturn_value,
bool_true,
2020-04-19 17:04:11 -07:00
bool_false, // See last_no_payload_tag below.
2020-04-18 16:41:45 -07:00
// After this, the tag requires a payload.
2020-04-17 21:09:43 -07:00
2020-04-18 16:41:45 -07:00
ty,
2020-04-17 21:09:43 -07:00
int_u64,
int_i64,
2020-04-21 14:54:00 -07:00
int_big,
2020-04-17 21:09:43 -07:00
function,
ref,
2020-04-21 18:14:56 -07:00
ref_val,
2020-04-17 21:09:43 -07:00
bytes,
2020-04-19 17:04:11 -07:00
pub const last_no_payload_tag = Tag.bool_false;
pub const no_payload_count = @enumToInt(last_no_payload_tag) + 1;
};
2020-04-18 17:22:54 -07:00
pub fn initTag(comptime small_tag: Tag) Value {
comptime assert(@enumToInt(small_tag) < Tag.no_payload_count);
return .{ .tag_if_small_enough = @enumToInt(small_tag) };
2020-04-18 16:41:45 -07:00
}
2020-04-18 16:41:45 -07:00
pub fn initPayload(payload: *Payload) Value {
assert(@enumToInt(payload.tag) >= Tag.no_payload_count);
return .{ .ptr_otherwise = payload };
}
2020-04-18 16:41:45 -07:00
pub fn tag(self: Value) Tag {
if (self.tag_if_small_enough < Tag.no_payload_count) {
2020-04-19 17:04:11 -07:00
return @intToEnum(Tag, @intCast(@TagType(Tag), self.tag_if_small_enough));
2020-04-18 16:41:45 -07:00
} else {
return self.ptr_otherwise.tag;
}
}
2020-04-19 17:04:11 -07:00
pub fn cast(self: Value, comptime T: type) ?*T {
if (self.tag_if_small_enough < Tag.no_payload_count)
return null;
const expected_tag = std.meta.fieldInfo(T, "base").default_value.?.tag;
if (self.ptr_otherwise.tag != expected_tag)
return null;
return @fieldParentPtr(T, "base", self.ptr_otherwise);
}
pub fn format(
self: Value,
comptime fmt: []const u8,
options: std.fmt.FormatOptions,
out_stream: var,
) !void {
comptime assert(fmt.len == 0);
2020-04-21 18:14:56 -07:00
var val = self;
while (true) switch (val.tag()) {
2020-04-21 14:06:09 -07:00
.u8_type => return out_stream.writeAll("u8"),
.i8_type => return out_stream.writeAll("i8"),
.isize_type => return out_stream.writeAll("isize"),
.usize_type => return out_stream.writeAll("usize"),
.c_short_type => return out_stream.writeAll("c_short"),
.c_ushort_type => return out_stream.writeAll("c_ushort"),
.c_int_type => return out_stream.writeAll("c_int"),
.c_uint_type => return out_stream.writeAll("c_uint"),
.c_long_type => return out_stream.writeAll("c_long"),
.c_ulong_type => return out_stream.writeAll("c_ulong"),
.c_longlong_type => return out_stream.writeAll("c_longlong"),
.c_ulonglong_type => return out_stream.writeAll("c_ulonglong"),
.c_longdouble_type => return out_stream.writeAll("c_longdouble"),
.f16_type => return out_stream.writeAll("f16"),
.f32_type => return out_stream.writeAll("f32"),
.f64_type => return out_stream.writeAll("f64"),
.f128_type => return out_stream.writeAll("f128"),
.c_void_type => return out_stream.writeAll("c_void"),
.bool_type => return out_stream.writeAll("bool"),
2020-04-19 17:04:11 -07:00
.void_type => return out_stream.writeAll("void"),
2020-04-21 14:06:09 -07:00
.type_type => return out_stream.writeAll("type"),
.anyerror_type => return out_stream.writeAll("anyerror"),
.comptime_int_type => return out_stream.writeAll("comptime_int"),
.comptime_float_type => return out_stream.writeAll("comptime_float"),
2020-04-19 17:04:11 -07:00
.noreturn_type => return out_stream.writeAll("noreturn"),
2020-04-21 14:06:09 -07:00
.fn_naked_noreturn_no_args_type => return out_stream.writeAll("fn() callconv(.Naked) noreturn"),
2020-04-21 18:14:56 -07:00
.single_const_pointer_to_comptime_int_type => return out_stream.writeAll("*const comptime_int"),
2020-04-21 14:06:09 -07:00
.const_slice_u8_type => return out_stream.writeAll("[]const u8"),
2020-04-21 21:04:52 -07:00
.zero => return out_stream.writeAll("0"),
2020-04-19 17:04:11 -07:00
.void_value => return out_stream.writeAll("{}"),
.noreturn_value => return out_stream.writeAll("unreachable"),
.bool_true => return out_stream.writeAll("true"),
.bool_false => return out_stream.writeAll("false"),
2020-04-21 18:14:56 -07:00
.ty => return val.cast(Payload.Ty).?.ty.format("", options, out_stream),
.int_u64 => return std.fmt.formatIntValue(val.cast(Payload.Int_u64).?.int, "", options, out_stream),
.int_i64 => return std.fmt.formatIntValue(val.cast(Payload.Int_i64).?.int, "", options, out_stream),
.int_big => return out_stream.print("{}", .{val.cast(Payload.IntBig).?.big_int}),
2020-04-19 17:04:11 -07:00
.function => return out_stream.writeAll("(function)"),
.ref => return out_stream.writeAll("(ref)"),
2020-04-21 18:14:56 -07:00
.ref_val => {
try out_stream.writeAll("*const ");
val = val.cast(Payload.RefVal).?.val;
continue;
},
.bytes => return std.zig.renderStringLiteral(self.cast(Payload.Bytes).?.data, out_stream),
2020-04-21 18:14:56 -07:00
};
2020-04-19 17:04:11 -07:00
}
2020-04-20 21:56:30 -07:00
/// Asserts that the value is representable as an array of bytes.
/// Copies the value into a freshly allocated slice of memory, which is owned by the caller.
pub fn toAllocatedBytes(self: Value, allocator: *Allocator) Allocator.Error![]u8 {
2020-04-20 21:56:30 -07:00
if (self.cast(Payload.Bytes)) |bytes| {
return std.mem.dupe(allocator, u8, bytes.data);
}
unreachable;
}
2020-04-21 13:06:15 -07:00
/// Asserts that the value is representable as a type.
pub fn toType(self: Value) Type {
return switch (self.tag()) {
.ty => self.cast(Payload.Ty).?.ty,
2020-04-21 14:06:09 -07:00
.u8_type => Type.initTag(.@"u8"),
.i8_type => Type.initTag(.@"i8"),
.isize_type => Type.initTag(.@"isize"),
.usize_type => Type.initTag(.@"usize"),
.c_short_type => Type.initTag(.@"c_short"),
.c_ushort_type => Type.initTag(.@"c_ushort"),
.c_int_type => Type.initTag(.@"c_int"),
.c_uint_type => Type.initTag(.@"c_uint"),
.c_long_type => Type.initTag(.@"c_long"),
.c_ulong_type => Type.initTag(.@"c_ulong"),
.c_longlong_type => Type.initTag(.@"c_longlong"),
.c_ulonglong_type => Type.initTag(.@"c_ulonglong"),
.c_longdouble_type => Type.initTag(.@"c_longdouble"),
.f16_type => Type.initTag(.@"f16"),
.f32_type => Type.initTag(.@"f32"),
.f64_type => Type.initTag(.@"f64"),
.f128_type => Type.initTag(.@"f128"),
.c_void_type => Type.initTag(.@"c_void"),
.bool_type => Type.initTag(.@"bool"),
2020-04-21 13:06:15 -07:00
.void_type => Type.initTag(.@"void"),
2020-04-21 14:06:09 -07:00
.type_type => Type.initTag(.@"type"),
.anyerror_type => Type.initTag(.@"anyerror"),
.comptime_int_type => Type.initTag(.@"comptime_int"),
.comptime_float_type => Type.initTag(.@"comptime_float"),
2020-04-21 13:06:15 -07:00
.noreturn_type => Type.initTag(.@"noreturn"),
2020-04-21 14:06:09 -07:00
.fn_naked_noreturn_no_args_type => Type.initTag(.fn_naked_noreturn_no_args),
2020-04-21 18:14:56 -07:00
.single_const_pointer_to_comptime_int_type => Type.initTag(.single_const_pointer_to_comptime_int),
2020-04-21 14:06:09 -07:00
.const_slice_u8_type => Type.initTag(.const_slice_u8),
2020-04-21 13:06:15 -07:00
2020-04-21 21:04:52 -07:00
.zero,
2020-04-21 13:06:15 -07:00
.void_value,
.noreturn_value,
.bool_true,
.bool_false,
.int_u64,
.int_i64,
2020-04-21 14:54:00 -07:00
.int_big,
2020-04-21 13:06:15 -07:00
.function,
.ref,
2020-04-21 18:14:56 -07:00
.ref_val,
2020-04-21 13:06:15 -07:00
.bytes,
=> unreachable,
};
}
/// Asserts the value is an integer.
pub fn toBigInt(self: Value, allocator: *Allocator) Allocator.Error!BigInt {
switch (self.tag()) {
.ty,
.u8_type,
.i8_type,
.isize_type,
.usize_type,
.c_short_type,
.c_ushort_type,
.c_int_type,
.c_uint_type,
.c_long_type,
.c_ulong_type,
.c_longlong_type,
.c_ulonglong_type,
.c_longdouble_type,
.f16_type,
.f32_type,
.f64_type,
.f128_type,
.c_void_type,
.bool_type,
.void_type,
.type_type,
.anyerror_type,
.comptime_int_type,
.comptime_float_type,
.noreturn_type,
.fn_naked_noreturn_no_args_type,
.single_const_pointer_to_comptime_int_type,
.const_slice_u8_type,
.void_value,
.noreturn_value,
.bool_true,
.bool_false,
.function,
.ref,
.ref_val,
.bytes,
=> unreachable,
.zero => return BigInt.initSet(allocator, 0),
.int_u64 => return BigInt.initSet(allocator, self.cast(Payload.Int_u64).?.int),
.int_i64 => return BigInt.initSet(allocator, self.cast(Payload.Int_i64).?.int),
.int_big => return self.cast(Payload.IntBig).?.big_int,
}
}
/// Asserts the value is an integer and it fits in a u64
pub fn toUnsignedInt(self: Value) u64 {
switch (self.tag()) {
.ty,
.u8_type,
.i8_type,
.isize_type,
.usize_type,
.c_short_type,
.c_ushort_type,
.c_int_type,
.c_uint_type,
.c_long_type,
.c_ulong_type,
.c_longlong_type,
.c_ulonglong_type,
.c_longdouble_type,
.f16_type,
.f32_type,
.f64_type,
.f128_type,
.c_void_type,
.bool_type,
.void_type,
.type_type,
.anyerror_type,
.comptime_int_type,
.comptime_float_type,
.noreturn_type,
.fn_naked_noreturn_no_args_type,
.single_const_pointer_to_comptime_int_type,
.const_slice_u8_type,
.void_value,
.noreturn_value,
.bool_true,
.bool_false,
.function,
.ref,
.ref_val,
.bytes,
=> unreachable,
.zero => return 0,
.int_u64 => return self.cast(Payload.Int_u64).?.int,
.int_i64 => return @intCast(u64, self.cast(Payload.Int_u64).?.int),
.int_big => return self.cast(Payload.IntBig).?.big_int.to(u64) catch unreachable,
}
}
2020-04-21 16:48:59 -07:00
/// Asserts the value is an integer, and the destination type is ComptimeInt or Int.
pub fn intFitsInType(self: Value, ty: Type, target: Target) bool {
switch (self.tag()) {
.ty,
.u8_type,
.i8_type,
.isize_type,
.usize_type,
.c_short_type,
.c_ushort_type,
.c_int_type,
.c_uint_type,
.c_long_type,
.c_ulong_type,
.c_longlong_type,
.c_ulonglong_type,
.c_longdouble_type,
.f16_type,
.f32_type,
.f64_type,
.f128_type,
.c_void_type,
.bool_type,
.void_type,
.type_type,
.anyerror_type,
.comptime_int_type,
.comptime_float_type,
.noreturn_type,
.fn_naked_noreturn_no_args_type,
2020-04-21 18:14:56 -07:00
.single_const_pointer_to_comptime_int_type,
2020-04-21 16:48:59 -07:00
.const_slice_u8_type,
.void_value,
.noreturn_value,
.bool_true,
.bool_false,
.function,
.ref,
2020-04-21 18:14:56 -07:00
.ref_val,
2020-04-21 16:48:59 -07:00
.bytes,
=> unreachable,
2020-04-21 21:04:52 -07:00
.zero => return true,
2020-04-21 16:48:59 -07:00
.int_u64 => switch (ty.zigTypeTag()) {
.Int => {
const x = self.cast(Payload.Int_u64).?.int;
2020-04-21 19:19:32 -07:00
if (x == 0) return true;
2020-04-21 16:48:59 -07:00
const info = ty.intInfo(target);
const needed_bits = std.math.log2(x) + 1 + @boolToInt(info.signed);
return info.bits >= needed_bits;
},
.ComptimeInt => return true,
else => unreachable,
},
.int_i64 => switch (ty.zigTypeTag()) {
.Int => {
const x = self.cast(Payload.Int_i64).?.int;
2020-04-21 19:19:32 -07:00
if (x == 0) return true;
2020-04-21 16:48:59 -07:00
const info = ty.intInfo(target);
if (!info.signed and x < 0)
return false;
@panic("TODO implement i64 intFitsInType");
},
.ComptimeInt => return true,
else => unreachable,
},
.int_big => switch (ty.zigTypeTag()) {
.Int => {
const info = ty.intInfo(target);
return self.cast(Payload.IntBig).?.big_int.fitsInTwosComp(info.signed, info.bits);
},
.ComptimeInt => return true,
else => unreachable,
},
}
}
2020-04-21 18:33:55 -07:00
/// Asserts the value is a pointer and dereferences it.
pub fn pointerDeref(self: Value) Value {
switch (self.tag()) {
.ty,
.u8_type,
.i8_type,
.isize_type,
.usize_type,
.c_short_type,
.c_ushort_type,
.c_int_type,
.c_uint_type,
.c_long_type,
.c_ulong_type,
.c_longlong_type,
.c_ulonglong_type,
.c_longdouble_type,
.f16_type,
.f32_type,
.f64_type,
.f128_type,
.c_void_type,
.bool_type,
.void_type,
.type_type,
.anyerror_type,
.comptime_int_type,
.comptime_float_type,
.noreturn_type,
.fn_naked_noreturn_no_args_type,
.single_const_pointer_to_comptime_int_type,
.const_slice_u8_type,
2020-04-21 21:04:52 -07:00
.zero,
2020-04-21 18:33:55 -07:00
.void_value,
.noreturn_value,
.bool_true,
.bool_false,
.function,
.int_u64,
.int_i64,
.int_big,
.bytes,
=> unreachable,
.ref => return self.cast(Payload.Ref).?.cell.contents,
.ref_val => return self.cast(Payload.RefVal).?.val,
}
}
2020-04-25 22:20:58 -07:00
/// Asserts the value is a single-item pointer to an array, or an array,
/// or an unknown-length pointer, and returns the element value at the index.
pub fn elemValueAt(self: Value, allocator: *Allocator, index: usize) Allocator.Error!Value {
switch (self.tag()) {
.ty,
.u8_type,
.i8_type,
.isize_type,
.usize_type,
.c_short_type,
.c_ushort_type,
.c_int_type,
.c_uint_type,
.c_long_type,
.c_ulong_type,
.c_longlong_type,
.c_ulonglong_type,
.c_longdouble_type,
.f16_type,
.f32_type,
.f64_type,
.f128_type,
.c_void_type,
.bool_type,
.void_type,
.type_type,
.anyerror_type,
.comptime_int_type,
.comptime_float_type,
.noreturn_type,
.fn_naked_noreturn_no_args_type,
.single_const_pointer_to_comptime_int_type,
.const_slice_u8_type,
.zero,
.void_value,
.noreturn_value,
.bool_true,
.bool_false,
.function,
.int_u64,
.int_i64,
.int_big,
=> unreachable,
.ref => @panic("TODO figure out how MemoryCell works"),
.ref_val => @panic("TODO figure out how MemoryCell works"),
.bytes => {
const int_payload = try allocator.create(Value.Payload.Int_u64);
int_payload.* = .{ .int = self.cast(Payload.Bytes).?.data[index] };
return Value.initPayload(&int_payload.base);
},
}
}
2020-04-18 16:41:45 -07:00
/// This type is not copyable since it may contain pointers to its inner data.
pub const Payload = struct {
tag: Tag,
2020-04-18 16:41:45 -07:00
pub const Int_u64 = struct {
base: Payload = Payload{ .tag = .int_u64 },
int: u64,
};
2020-04-18 16:41:45 -07:00
pub const Int_i64 = struct {
base: Payload = Payload{ .tag = .int_i64 },
int: i64,
};
2020-04-21 14:54:00 -07:00
pub const IntBig = struct {
base: Payload = Payload{ .tag = .int_big },
big_int: BigInt,
};
2020-04-18 16:41:45 -07:00
pub const Function = struct {
base: Payload = Payload{ .tag = .function },
2020-04-21 13:06:15 -07:00
/// Index into the `fns` array of the `ir.Module`
index: usize,
2020-04-18 16:41:45 -07:00
};
pub const ArraySentinel0_u8_Type = struct {
base: Payload = Payload{ .tag = .array_sentinel_0_u8_type },
len: u64,
};
pub const SingleConstPtrType = struct {
base: Payload = Payload{ .tag = .single_const_ptr_type },
elem_type: *Type,
};
pub const Ref = struct {
base: Payload = Payload{ .tag = .ref },
2020-04-21 18:33:55 -07:00
cell: *MemoryCell,
2020-04-18 16:41:45 -07:00
};
2020-04-21 18:14:56 -07:00
pub const RefVal = struct {
base: Payload = Payload{ .tag = .ref_val },
val: Value,
};
2020-04-18 16:41:45 -07:00
pub const Bytes = struct {
base: Payload = Payload{ .tag = .bytes },
2020-04-20 22:20:01 -07:00
data: []const u8,
2020-04-18 16:41:45 -07:00
};
2018-07-13 18:56:38 -07:00
2020-04-18 16:41:45 -07:00
pub const Ty = struct {
2020-04-19 17:04:11 -07:00
base: Payload = Payload{ .tag = .ty },
ty: Type,
2020-04-18 16:41:45 -07:00
};
2020-04-17 21:09:43 -07:00
};
};
2020-04-18 16:41:45 -07:00
/// This is the heart of resource management of the Zig compiler. The Zig compiler uses
/// stop-the-world mark-and-sweep garbage collection during compilation to manage the resources
/// associated with evaluating compile-time code and semantic analysis. Each `MemoryCell` represents
/// a root.
2020-04-17 21:09:43 -07:00
pub const MemoryCell = struct {
parent: Parent,
2020-04-18 16:41:45 -07:00
contents: Value,
2020-04-17 21:09:43 -07:00
pub const Parent = union(enum) {
none,
struct_field: struct {
struct_base: *MemoryCell,
field_index: usize,
2020-04-17 21:09:43 -07:00
},
array_elem: struct {
array_base: *MemoryCell,
elem_index: usize,
2020-04-17 21:09:43 -07:00
},
union_field: *MemoryCell,
err_union_code: *MemoryCell,
err_union_payload: *MemoryCell,
optional_payload: *MemoryCell,
optional_flag: *MemoryCell,
};
};