Skip to content

Commit cc36b5c

Browse files
committed
support pointer subtraction
1 parent 103b885 commit cc36b5c

File tree

7 files changed

+144
-47
lines changed

7 files changed

+144
-47
lines changed

doc/langref.html.in

+6-3
Original file line numberDiff line numberDiff line change
@@ -1934,16 +1934,18 @@ or
19341934
<li>{#syntax#}*T{#endsyntax#} - single-item pointer to exactly one item.
19351935
<ul>
19361936
<li>Supports deref syntax: {#syntax#}ptr.*{#endsyntax#}</li>
1937+
<li>Supports pointer subtraction: {#syntax#}ptr - ptr{#endsyntax#}</li>
19371938
</ul>
19381939
</li>
19391940
<li>{#syntax#}[*]T{#endsyntax#} - many-item pointer to unknown number of items.
19401941
<ul>
19411942
<li>Supports index syntax: {#syntax#}ptr[i]{#endsyntax#}</li>
19421943
<li>Supports slice syntax: {#syntax#}ptr[start..end]{#endsyntax#} and {#syntax#}ptr[start..]{#endsyntax#}</li>
1943-
<li>Supports pointer arithmetic: {#syntax#}ptr + x{#endsyntax#}, {#syntax#}ptr - x{#endsyntax#}</li>
1944-
<li>{#syntax#}T{#endsyntax#} must have a known size, which means that it cannot be
1945-
{#syntax#}anyopaque{#endsyntax#} or any other {#link|opaque type|opaque#}.</li>
1944+
<li>Supports pointer-integer arithmetic: {#syntax#}ptr + int{#endsyntax#}, {#syntax#}ptr - int{#endsyntax#}</li>
1945+
<li>Supports pointer subtraction: {#syntax#}ptr - ptr{#endsyntax#}</li>
19461946
</ul>
1947+
{#syntax#}T{#endsyntax#} must have a known size, which means that it cannot be
1948+
{#syntax#}anyopaque{#endsyntax#} or any other {#link|opaque type|opaque#}.
19471949
</li>
19481950
</ul>
19491951
<p>These types are closely related to {#link|Arrays#} and {#link|Slices#}:</p>
@@ -1953,6 +1955,7 @@ or
19531955
<li>Supports index syntax: {#syntax#}array_ptr[i]{#endsyntax#}</li>
19541956
<li>Supports slice syntax: {#syntax#}array_ptr[start..end]{#endsyntax#}</li>
19551957
<li>Supports len property: {#syntax#}array_ptr.len{#endsyntax#}</li>
1958+
<li>Supports pointer subtraction: {#syntax#}array_ptr - array_ptr{#endsyntax#}</li>
19561959
</ul>
19571960
</li>
19581961
</ul>

doc/langref/test_pointer_arithmetic.zig

+3
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,9 @@ test "pointer arithmetic with many-item pointer" {
1111
// slicing a many-item pointer without an end is equivalent to
1212
// pointer arithmetic: `ptr[start..] == ptr + start`
1313
try expect(ptr[1..] == ptr + 1);
14+
15+
// subtraction between the memory addresses of any two pointers except slices is supported
16+
try expect(&ptr[1] - &ptr[0] == @sizeOf(i32));
1417
}
1518

1619
test "pointer arithmetic with slices" {

lib/std/hash_map.zig

+1-2
Original file line numberDiff line numberDiff line change
@@ -1483,12 +1483,11 @@ pub fn HashMapUnmanaged(
14831483
/// key_ptr is assumed to be a valid pointer to a key that is present
14841484
/// in the hash map.
14851485
pub fn removeByPtr(self: *Self, key_ptr: *K) void {
1486-
// TODO: replace with pointer subtraction once supported by zig
14871486
// if @sizeOf(K) == 0 then there is at most one item in the hash
14881487
// map, which is assumed to exist as key_ptr must be valid. This
14891488
// item must be at index 0.
14901489
const idx = if (@sizeOf(K) > 0)
1491-
(@intFromPtr(key_ptr) - @intFromPtr(self.keys())) / @sizeOf(K)
1490+
(key_ptr - self.keys()) / @sizeOf(K)
14921491
else
14931492
0;
14941493

src/InternPool.zig

+19-15
Original file line numberDiff line numberDiff line change
@@ -1112,6 +1112,23 @@ pub const Key = union(enum) {
11121112
/// the original pointer type alignment must be used.
11131113
orig_ty: Index,
11141114
};
1115+
1116+
pub fn eql(a: BaseAddr, b: BaseAddr) bool {
1117+
if (@as(Key.Ptr.BaseAddr.Tag, a) != @as(Key.Ptr.BaseAddr.Tag, b)) return false;
1118+
1119+
return switch (a) {
1120+
.decl => |a_decl| a_decl == b.decl,
1121+
.comptime_alloc => |a_alloc| a_alloc == b.comptime_alloc,
1122+
.anon_decl => |ad| ad.val == b.anon_decl.val and
1123+
ad.orig_ty == b.anon_decl.orig_ty,
1124+
.int => true,
1125+
.eu_payload => |a_eu_payload| a_eu_payload == b.eu_payload,
1126+
.opt_payload => |a_opt_payload| a_opt_payload == b.opt_payload,
1127+
.comptime_field => |a_comptime_field| a_comptime_field == b.comptime_field,
1128+
.arr_elem => |a_elem| std.meta.eql(a_elem, b.arr_elem),
1129+
.field => |a_field| std.meta.eql(a_field, b.field),
1130+
};
1131+
}
11151132
};
11161133
};
11171134

@@ -1550,21 +1567,8 @@ pub const Key = union(enum) {
15501567
const b_info = b.ptr;
15511568
if (a_info.ty != b_info.ty) return false;
15521569
if (a_info.byte_offset != b_info.byte_offset) return false;
1553-
1554-
if (@as(Key.Ptr.BaseAddr.Tag, a_info.base_addr) != @as(Key.Ptr.BaseAddr.Tag, b_info.base_addr)) return false;
1555-
1556-
return switch (a_info.base_addr) {
1557-
.decl => |a_decl| a_decl == b_info.base_addr.decl,
1558-
.comptime_alloc => |a_alloc| a_alloc == b_info.base_addr.comptime_alloc,
1559-
.anon_decl => |ad| ad.val == b_info.base_addr.anon_decl.val and
1560-
ad.orig_ty == b_info.base_addr.anon_decl.orig_ty,
1561-
.int => true,
1562-
.eu_payload => |a_eu_payload| a_eu_payload == b_info.base_addr.eu_payload,
1563-
.opt_payload => |a_opt_payload| a_opt_payload == b_info.base_addr.opt_payload,
1564-
.comptime_field => |a_comptime_field| a_comptime_field == b_info.base_addr.comptime_field,
1565-
.arr_elem => |a_elem| std.meta.eql(a_elem, b_info.base_addr.arr_elem),
1566-
.field => |a_field| std.meta.eql(a_field, b_info.base_addr.field),
1567-
};
1570+
if (!a_info.base_addr.eql(b_info.base_addr)) return false;
1571+
return true;
15681572
},
15691573

15701574
.int => |a_info| {

src/Sema.zig

+71-25
Original file line numberDiff line numberDiff line change
@@ -2391,6 +2391,16 @@ fn failWithComptimeErrorRetTrace(
23912391
return sema.failWithOwnedErrorMsg(block, msg);
23922392
}
23932393

2394+
fn failWithInvalidPtrArithmetic(sema: *Sema, block: *Block, src: LazySrcLoc, arithmetic: []const u8, supports: []const u8) CompileError {
2395+
const msg = msg: {
2396+
const msg = try sema.errMsg(block, src, "invalid {s} arithmetic operator", .{arithmetic});
2397+
errdefer msg.destroy(sema.gpa);
2398+
try sema.errNote(block, src, msg, "{s} arithmetic only supports {s}", .{ arithmetic, supports });
2399+
break :msg msg;
2400+
};
2401+
return sema.failWithOwnedErrorMsg(block, msg);
2402+
}
2403+
23942404
/// We don't return a pointer to the new error note because the pointer
23952405
/// becomes invalid when you add another one.
23962406
fn errNote(
@@ -15146,7 +15156,7 @@ fn zirDiv(sema: *Sema, block: *Block, inst: Zir.Inst.Index) CompileError!Air.Ins
1514615156
const lhs_zig_ty_tag = try lhs_ty.zigTypeTagOrPoison(mod);
1514715157
const rhs_zig_ty_tag = try rhs_ty.zigTypeTagOrPoison(mod);
1514815158
try sema.checkVectorizableBinaryOperands(block, src, lhs_ty, rhs_ty, lhs_src, rhs_src);
15149-
try sema.checkInvalidPtrArithmetic(block, src, lhs_ty);
15159+
try sema.checkInvalidPtrIntArithmetic(block, src, lhs_ty);
1515015160

1515115161
const instructions = &[_]Air.Inst.Ref{ lhs, rhs };
1515215162
const resolved_type = try sema.resolvePeerTypes(block, src, instructions, .{
@@ -15311,7 +15321,7 @@ fn zirDivExact(sema: *Sema, block: *Block, inst: Zir.Inst.Index) CompileError!Ai
1531115321
const lhs_zig_ty_tag = try lhs_ty.zigTypeTagOrPoison(mod);
1531215322
const rhs_zig_ty_tag = try rhs_ty.zigTypeTagOrPoison(mod);
1531315323
try sema.checkVectorizableBinaryOperands(block, src, lhs_ty, rhs_ty, lhs_src, rhs_src);
15314-
try sema.checkInvalidPtrArithmetic(block, src, lhs_ty);
15324+
try sema.checkInvalidPtrIntArithmetic(block, src, lhs_ty);
1531515325

1531615326
const instructions = &[_]Air.Inst.Ref{ lhs, rhs };
1531715327
const resolved_type = try sema.resolvePeerTypes(block, src, instructions, .{
@@ -15476,7 +15486,7 @@ fn zirDivFloor(sema: *Sema, block: *Block, inst: Zir.Inst.Index) CompileError!Ai
1547615486
const lhs_zig_ty_tag = try lhs_ty.zigTypeTagOrPoison(mod);
1547715487
const rhs_zig_ty_tag = try rhs_ty.zigTypeTagOrPoison(mod);
1547815488
try sema.checkVectorizableBinaryOperands(block, src, lhs_ty, rhs_ty, lhs_src, rhs_src);
15479-
try sema.checkInvalidPtrArithmetic(block, src, lhs_ty);
15489+
try sema.checkInvalidPtrIntArithmetic(block, src, lhs_ty);
1548015490

1548115491
const instructions = &[_]Air.Inst.Ref{ lhs, rhs };
1548215492
const resolved_type = try sema.resolvePeerTypes(block, src, instructions, .{
@@ -15586,7 +15596,7 @@ fn zirDivTrunc(sema: *Sema, block: *Block, inst: Zir.Inst.Index) CompileError!Ai
1558615596
const lhs_zig_ty_tag = try lhs_ty.zigTypeTagOrPoison(mod);
1558715597
const rhs_zig_ty_tag = try rhs_ty.zigTypeTagOrPoison(mod);
1558815598
try sema.checkVectorizableBinaryOperands(block, src, lhs_ty, rhs_ty, lhs_src, rhs_src);
15589-
try sema.checkInvalidPtrArithmetic(block, src, lhs_ty);
15599+
try sema.checkInvalidPtrIntArithmetic(block, src, lhs_ty);
1559015600

1559115601
const instructions = &[_]Air.Inst.Ref{ lhs, rhs };
1559215602
const resolved_type = try sema.resolvePeerTypes(block, src, instructions, .{
@@ -15827,7 +15837,7 @@ fn zirModRem(sema: *Sema, block: *Block, inst: Zir.Inst.Index) CompileError!Air.
1582715837
const lhs_zig_ty_tag = try lhs_ty.zigTypeTagOrPoison(mod);
1582815838
const rhs_zig_ty_tag = try rhs_ty.zigTypeTagOrPoison(mod);
1582915839
try sema.checkVectorizableBinaryOperands(block, src, lhs_ty, rhs_ty, lhs_src, rhs_src);
15830-
try sema.checkInvalidPtrArithmetic(block, src, lhs_ty);
15840+
try sema.checkInvalidPtrIntArithmetic(block, src, lhs_ty);
1583115841

1583215842
const instructions = &[_]Air.Inst.Ref{ lhs, rhs };
1583315843
const resolved_type = try sema.resolvePeerTypes(block, src, instructions, .{
@@ -16011,7 +16021,7 @@ fn zirMod(sema: *Sema, block: *Block, inst: Zir.Inst.Index) CompileError!Air.Ins
1601116021
const lhs_zig_ty_tag = try lhs_ty.zigTypeTagOrPoison(mod);
1601216022
const rhs_zig_ty_tag = try rhs_ty.zigTypeTagOrPoison(mod);
1601316023
try sema.checkVectorizableBinaryOperands(block, src, lhs_ty, rhs_ty, lhs_src, rhs_src);
16014-
try sema.checkInvalidPtrArithmetic(block, src, lhs_ty);
16024+
try sema.checkInvalidPtrIntArithmetic(block, src, lhs_ty);
1601516025

1601616026
const instructions = &[_]Air.Inst.Ref{ lhs, rhs };
1601716027
const resolved_type = try sema.resolvePeerTypes(block, src, instructions, .{
@@ -16106,7 +16116,7 @@ fn zirRem(sema: *Sema, block: *Block, inst: Zir.Inst.Index) CompileError!Air.Ins
1610616116
const lhs_zig_ty_tag = try lhs_ty.zigTypeTagOrPoison(mod);
1610716117
const rhs_zig_ty_tag = try rhs_ty.zigTypeTagOrPoison(mod);
1610816118
try sema.checkVectorizableBinaryOperands(block, src, lhs_ty, rhs_ty, lhs_src, rhs_src);
16109-
try sema.checkInvalidPtrArithmetic(block, src, lhs_ty);
16119+
try sema.checkInvalidPtrIntArithmetic(block, src, lhs_ty);
1611016120

1611116121
const instructions = &[_]Air.Inst.Ref{ lhs, rhs };
1611216122
const resolved_type = try sema.resolvePeerTypes(block, src, instructions, .{
@@ -16445,17 +16455,58 @@ fn analyzeArithmetic(
1644516455
const rhs_zig_ty_tag = try rhs_ty.zigTypeTagOrPoison(mod);
1644616456
try sema.checkVectorizableBinaryOperands(block, src, lhs_ty, rhs_ty, lhs_src, rhs_src);
1644716457

16448-
if (lhs_zig_ty_tag == .Pointer) switch (lhs_ty.ptrSize(mod)) {
16449-
.One, .Slice => {},
16450-
.Many, .C => {
16451-
const air_tag: Air.Inst.Tag = switch (zir_tag) {
16452-
.add => .ptr_add,
16453-
.sub => .ptr_sub,
16454-
else => return sema.fail(block, src, "invalid pointer arithmetic operator", .{}),
16455-
};
16456-
return sema.analyzePtrArithmetic(block, src, lhs, rhs, air_tag, lhs_src, rhs_src);
16457-
},
16458-
};
16458+
if (lhs_zig_ty_tag == .Pointer) {
16459+
if (rhs_zig_ty_tag == .Pointer) {
16460+
if (lhs_ty.ptrSize(mod) != .Slice and rhs_ty.ptrSize(mod) != .Slice) {
16461+
if (zir_tag != .sub) {
16462+
return sema.failWithInvalidPtrArithmetic(block, src, "pointer-pointer", "subtraction");
16463+
}
16464+
16465+
const runtime_src = runtime_src: {
16466+
if (try sema.resolveValue(lhs)) |lhs_value| {
16467+
if (try sema.resolveValue(rhs)) |rhs_value| {
16468+
const lhs_ptr = switch (mod.intern_pool.indexToKey(lhs_value.toIntern())) {
16469+
.undef => return sema.failWithUseOfUndef(block, lhs_src),
16470+
.ptr => |ptr| ptr,
16471+
else => unreachable,
16472+
};
16473+
const rhs_ptr = switch (mod.intern_pool.indexToKey(rhs_value.toIntern())) {
16474+
.undef => return sema.failWithUseOfUndef(block, rhs_src),
16475+
.ptr => |ptr| ptr,
16476+
else => unreachable,
16477+
};
16478+
// Make sure the pointers point to the same data.
16479+
if (!lhs_ptr.base_addr.eql(rhs_ptr.base_addr)) break :runtime_src src;
16480+
const address = std.math.sub(u64, lhs_ptr.byte_offset, rhs_ptr.byte_offset) catch
16481+
return sema.fail(block, src, "operation results in overflow", .{});
16482+
return try mod.intRef(Type.usize, address);
16483+
} else {
16484+
break :runtime_src lhs_src;
16485+
}
16486+
} else {
16487+
break :runtime_src rhs_src;
16488+
}
16489+
};
16490+
16491+
try sema.requireRuntimeBlock(block, src, runtime_src);
16492+
const lhs_int = try block.addUnOp(.int_from_ptr, lhs);
16493+
const rhs_int = try block.addUnOp(.int_from_ptr, rhs);
16494+
return try block.addBinOp(.sub_wrap, lhs_int, rhs_int);
16495+
}
16496+
} else {
16497+
switch (lhs_ty.ptrSize(mod)) {
16498+
.One, .Slice => {},
16499+
.Many, .C => {
16500+
const air_tag: Air.Inst.Tag = switch (zir_tag) {
16501+
.add => .ptr_add,
16502+
.sub => .ptr_sub,
16503+
else => return sema.failWithInvalidPtrArithmetic(block, src, "pointer-integer", "addition and subtraction"),
16504+
};
16505+
return sema.analyzePtrArithmetic(block, src, lhs, rhs, air_tag, lhs_src, rhs_src);
16506+
},
16507+
}
16508+
}
16509+
}
1645916510

1646016511
const instructions = &[_]Air.Inst.Ref{ lhs, rhs };
1646116512
const resolved_type = try sema.resolvePeerTypes(block, src, instructions, .{
@@ -23715,7 +23766,7 @@ fn checkIntType(sema: *Sema, block: *Block, src: LazySrcLoc, ty: Type) CompileEr
2371523766
}
2371623767
}
2371723768

23718-
fn checkInvalidPtrArithmetic(
23769+
fn checkInvalidPtrIntArithmetic(
2371923770
sema: *Sema,
2372023771
block: *Block,
2372123772
src: LazySrcLoc,
@@ -23725,12 +23776,7 @@ fn checkInvalidPtrArithmetic(
2372523776
switch (try ty.zigTypeTagOrPoison(mod)) {
2372623777
.Pointer => switch (ty.ptrSize(mod)) {
2372723778
.One, .Slice => return,
23728-
.Many, .C => return sema.fail(
23729-
block,
23730-
src,
23731-
"invalid pointer arithmetic operator",
23732-
.{},
23733-
),
23779+
.Many, .C => return sema.failWithInvalidPtrArithmetic(block, src, "pointer-integer", "addition and subtraction"),
2373423780
},
2373523781
else => return,
2373623782
}

test/behavior/pointers.zig

+28-2
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@ fn testDerefPtr() !void {
1717
try expect(x == 1235);
1818
}
1919

20-
test "pointer arithmetic" {
20+
test "pointer-integer arithmetic" {
2121
if (builtin.zig_backend == .stage2_aarch64) return error.SkipZigTest;
2222
if (builtin.zig_backend == .stage2_sparc64) return error.SkipZigTest; // TODO
2323
if (builtin.zig_backend == .stage2_riscv64) return error.SkipZigTest;
@@ -43,6 +43,32 @@ test "pointer arithmetic" {
4343
try expect(ptr[0] == 'a');
4444
}
4545

46+
test "pointer subtraction" {
47+
if (builtin.zig_backend == .stage2_sparc64) return error.SkipZigTest; // TODO
48+
if (builtin.zig_backend == .stage2_riscv64) return error.SkipZigTest;
49+
50+
{
51+
const a: *u8 = @ptrFromInt(100);
52+
const b: *u8 = @ptrFromInt(50);
53+
try expect(a - b == 50);
54+
}
55+
{
56+
var ptr: [*]const u8 = "abc";
57+
try expect(&ptr[1] - &ptr[0] == 1);
58+
try expect(&ptr[2] - &ptr[0] == 2);
59+
}
60+
{
61+
const a: *[100]u8 = @ptrFromInt(100);
62+
const b: *[100]u8 = @ptrFromInt(50);
63+
try expect(a - b == 50);
64+
}
65+
comptime {
66+
const a: *const [3]u8 = "abc";
67+
const b: [*]const u8 = @ptrCast(a);
68+
try expect(&a[1] - &b[0] == 1);
69+
}
70+
}
71+
4672
test "double pointer parsing" {
4773
comptime assert(PtrOf(PtrOf(i32)) == **i32);
4874
}
@@ -385,7 +411,7 @@ test "pointer to array at fixed address" {
385411
try expect(@intFromPtr(&array[1]) == 0x14);
386412
}
387413

388-
test "pointer arithmetic affects the alignment" {
414+
test "pointer-integer arithmetic affects the alignment" {
389415
{
390416
var ptr: [*]align(8) u32 = undefined;
391417
var x: usize = 1;
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,16 @@
1+
export fn a(x: [*]u8) void {
2+
_ = x * 1;
3+
}
4+
5+
export fn b(x: *u8) void {
6+
_ = x * x;
7+
}
8+
9+
// error
10+
// backend=stage2
11+
// target=native
12+
//
13+
// :2:11: error: invalid pointer-integer arithmetic operator
14+
// :2:11: note: pointer-integer arithmetic only supports addition and subtraction
15+
// :6:11: error: invalid pointer-pointer arithmetic operator
16+
// :6:11: note: pointer-pointer arithmetic only supports subtraction

0 commit comments

Comments
 (0)