Skip to content

Commit d357b5c

Browse files
committed
AArch64: make register X29 callee-save
CompCert doesn't maintain a frame pointer in X29. However, it must treat X29 as callee-save, so that CompCert-generated code can be called from code that uses X29 as frame pointer. This commit makes X29 callee-save. In places where X29 was used as a temporary, X15 or X14 is used instead.
1 parent 318fc06 commit d357b5c

File tree

6 files changed

+34
-34
lines changed

6 files changed

+34
-34
lines changed

aarch64/Asm.v

+1-1
Original file line numberDiff line numberDiff line change
@@ -1067,7 +1067,7 @@ Definition exec_instr (f: function) (i: instruction) (rs: regset) (m: mem) : out
10671067
let sp := (Vptr stk Ptrofs.zero) in
10681068
match Mem.storev Mint64 m1 (Val.offset_ptr sp pos) rs#SP with
10691069
| None => Stuck
1070-
| Some m2 => Next (nextinstr (rs #X29 <- (rs#SP) #SP <- sp #X16 <- Vundef)) m2
1070+
| Some m2 => Next (nextinstr (rs #X15 <- (rs#SP) #SP <- sp #X16 <- Vundef)) m2
10711071
end
10721072
| Pfreeframe sz pos =>
10731073
match Mem.loadv Mint64 m (Val.offset_ptr rs#SP pos) with

aarch64/Asmexpand.ml

+10-10
Original file line numberDiff line numberDiff line change
@@ -192,8 +192,8 @@ let memcpy_small_arg sz arg tmp =
192192
assert false
193193

194194
let expand_builtin_memcpy_small sz al src dst =
195-
let tsrc = if dst <> BA (IR X17) then X17 else X29 in
196-
let tdst = if src <> BA (IR X29) then X29 else X17 in
195+
let tsrc = if dst <> BA (IR X17) then X17 else X15 in
196+
let tdst = if src <> BA (IR X15) then X15 else X17 in
197197
let (rsrc, osrc) = memcpy_small_arg sz src tsrc in
198198
let (rdst, odst) = memcpy_small_arg sz dst tdst in
199199
let rec copy osrc odst sz =
@@ -233,29 +233,29 @@ let memcpy_big_arg arg tmp =
233233
let expand_builtin_memcpy_big sz al src dst =
234234
assert (sz >= 16);
235235
memcpy_big_arg src X30;
236-
memcpy_big_arg dst X29;
236+
memcpy_big_arg dst X14;
237237
let lbl = new_label () in
238238
expand_loadimm32 X15 (Z.of_uint (sz / 16));
239239
emit (Plabel lbl);
240240
emit (Pldp(X16, X17, ADpostincr(RR1 X30, _16)));
241-
emit (Pstp(X16, X17, ADpostincr(RR1 X29, _16)));
241+
emit (Pstp(X16, X17, ADpostincr(RR1 X14, _16)));
242242
emit (Psubimm(W, RR1 X15, RR1 X15, _1));
243243
emit (Pcbnz(W, X15, lbl));
244244
if sz mod 16 >= 8 then begin
245245
emit (Pldrx(X16, ADpostincr(RR1 X30, _8)));
246-
emit (Pstrx(X16, ADpostincr(RR1 X29, _8)))
246+
emit (Pstrx(X16, ADpostincr(RR1 X14, _8)))
247247
end;
248248
if sz mod 8 >= 4 then begin
249249
emit (Pldrw(X16, ADpostincr(RR1 X30, _4)));
250-
emit (Pstrw(X16, ADpostincr(RR1 X29, _4)))
250+
emit (Pstrw(X16, ADpostincr(RR1 X14, _4)))
251251
end;
252252
if sz mod 4 >= 2 then begin
253253
emit (Pldrh(W, X16, ADpostincr(RR1 X30, _2)));
254-
emit (Pstrh(X16, ADpostincr(RR1 X29, _2)))
254+
emit (Pstrh(X16, ADpostincr(RR1 X14, _2)))
255255
end;
256256
if sz mod 2 >= 1 then begin
257257
emit (Pldrb(W, X16, ADpostincr(RR1 X30, _1)));
258-
emit (Pstrb(X16, ADpostincr(RR1 X29, _1)))
258+
emit (Pstrb(X16, ADpostincr(RR1 X14, _1)))
259259
end
260260

261261
let expand_builtin_memcpy sz al args =
@@ -412,7 +412,7 @@ let expand_builtin_inline name args res =
412412
let expand_instruction instr =
413413
match instr with
414414
| Pallocframe (sz, ofs) ->
415-
emit (Pmov (RR1 X29, XSP));
415+
emit (Pmov (RR1 X15, XSP));
416416
if is_current_function_variadic() && Archi.abi = Archi.AAPCS64 then begin
417417
let (ir, fr, _) =
418418
next_arg_locations 0 0 0 (get_current_function_args ()) in
@@ -423,7 +423,7 @@ let expand_instruction instr =
423423
current_function_stacksize := Z.to_int64 sz
424424
end;
425425
expand_addimm64 XSP XSP (Ptrofs.repr (Z.neg sz));
426-
expand_storeptr X29 XSP ofs
426+
expand_storeptr X15 XSP ofs
427427
| Pfreeframe (sz, ofs) ->
428428
expand_addimm64 XSP XSP (coqint_of_camlint64 !current_function_stacksize)
429429
| Pcvtx2w rd ->

aarch64/Asmgen.v

+5-5
Original file line numberDiff line numberDiff line change
@@ -1057,16 +1057,16 @@ Definition make_epilogue (f: Mach.function) (k: code) :=
10571057
(** Translation of a Mach instruction. *)
10581058

10591059
Definition transl_instr (f: Mach.function) (i: Mach.instruction)
1060-
(r29_is_parent: bool) (k: code) : res code :=
1060+
(r15_is_parent: bool) (k: code) : res code :=
10611061
match i with
10621062
| Mgetstack ofs ty dst =>
10631063
loadind XSP ofs ty dst k
10641064
| Msetstack src ofs ty =>
10651065
storeind src XSP ofs ty k
10661066
| Mgetparam ofs ty dst =>
10671067
(* load via the frame pointer if it is valid *)
1068-
do c <- loadind X29 ofs ty dst k;
1069-
OK (if r29_is_parent then c else loadptr XSP f.(fn_link_ofs) X29 c)
1068+
do c <- loadind X15 ofs ty dst k;
1069+
OK (if r15_is_parent then c else loadptr XSP f.(fn_link_ofs) X15 c)
10701070
| Mop op args res =>
10711071
transl_op op args res k
10721072
| Mload chunk addr args dst =>
@@ -1102,8 +1102,8 @@ Definition transl_instr (f: Mach.function) (i: Mach.instruction)
11021102
Definition it1_is_parent (before: bool) (i: Mach.instruction) : bool :=
11031103
match i with
11041104
| Msetstack src ofs ty => before
1105-
| Mgetparam ofs ty dst => negb (mreg_eq dst R29)
1106-
| Mop op args res => before && negb (mreg_eq res R29)
1105+
| Mgetparam ofs ty dst => negb (mreg_eq dst R15)
1106+
| Mop op args res => before && negb (mreg_eq res R15)
11071107
| _ => false
11081108
end.
11091109

aarch64/Asmgenproof.v

+12-12
Original file line numberDiff line numberDiff line change
@@ -472,7 +472,7 @@ Inductive match_states: Mach.state -> Asm.state -> Prop :=
472472
(MEXT: Mem.extends m m')
473473
(AT: transl_code_at_pc ge (rs PC) fb f c ep tf tc)
474474
(AG: agree ms sp rs)
475-
(DXP: ep = true -> rs#X29 = parent_sp s),
475+
(DXP: ep = true -> rs#X15 = parent_sp s),
476476
match_states (Mach.State s fb sp c ms m)
477477
(Asm.State rs m')
478478
| match_states_call:
@@ -503,7 +503,7 @@ Lemma exec_straight_steps:
503503
exists rs2,
504504
exec_straight tge tf c rs1 m1' k rs2 m2'
505505
/\ agree ms2 sp rs2
506-
/\ (it1_is_parent ep i = true -> rs2#X29 = parent_sp s)) ->
506+
/\ (it1_is_parent ep i = true -> rs2#X15 = parent_sp s)) ->
507507
exists st',
508508
plus step tge (State rs1 m1') E0 st' /\
509509
match_states (Mach.State s fb sp c ms2 m2) st'.
@@ -614,9 +614,9 @@ Definition measure (s: Mach.state) : nat :=
614614
| Mach.Returnstate _ _ _ => 1%nat
615615
end.
616616

617-
Remark preg_of_not_X29: forall r, negb (mreg_eq r R29) = true -> IR X29 <> preg_of r.
617+
Remark preg_of_not_X15: forall r, negb (mreg_eq r R15) = true -> IR X15 <> preg_of r.
618618
Proof.
619-
intros. change (IR X29) with (preg_of R29). red; intros.
619+
intros. change (IR X15) with (preg_of R15). red; intros.
620620
exploit preg_of_injective; eauto. intros; subst r; discriminate.
621621
Qed.
622622

@@ -672,26 +672,26 @@ Proof.
672672
Opaque loadind.
673673
left; eapply exec_straight_steps; eauto; intros. monadInv TR.
674674
destruct ep.
675-
(* X30 contains parent *)
675+
(* X15 contains parent *)
676676
exploit loadind_correct. eexact EQ.
677677
instantiate (2 := rs0). simpl; rewrite DXP; eauto. simpl; congruence.
678678
intros [rs1 [P [Q R]]].
679679
exists rs1; split. eauto.
680680
split. eapply agree_set_mreg. eapply agree_set_mreg; eauto. congruence. auto with asmgen.
681681
simpl; intros. rewrite R; auto with asmgen.
682-
apply preg_of_not_X29; auto.
683-
(* X30 does not contain parent *)
682+
apply preg_of_not_X15; auto.
683+
(* X15 does not contain parent *)
684684
exploit loadptr_correct. eexact A. simpl; congruence. intros [rs1 [P [Q R]]].
685685
exploit loadind_correct. eexact EQ. instantiate (2 := rs1). simpl; rewrite Q. eauto. simpl; congruence.
686686
intros [rs2 [S [T U]]].
687687
exists rs2; split. eapply exec_straight_trans; eauto.
688688
split. eapply agree_set_mreg. eapply agree_set_mreg. eauto. eauto.
689-
instantiate (1 := rs1#X29 <- (rs2#X29)). intros.
689+
instantiate (1 := rs1#X15 <- (rs2#X15)). intros.
690690
rewrite Pregmap.gso; auto with asmgen.
691691
congruence.
692-
intros. unfold Pregmap.set. destruct (PregEq.eq r' X29). congruence. auto with asmgen.
692+
intros. unfold Pregmap.set. destruct (PregEq.eq r' X15). congruence. auto with asmgen.
693693
simpl; intros. rewrite U; auto with asmgen.
694-
apply preg_of_not_X29; auto.
694+
apply preg_of_not_X15; auto.
695695

696696
- (* Mop *)
697697
assert (eval_operation tge sp op (map rs args) m = Some v).
@@ -704,7 +704,7 @@ Opaque loadind.
704704
apply agree_set_undef_mreg with rs0; auto.
705705
apply Val.lessdef_trans with v'; auto.
706706
simpl; intros. InvBooleans.
707-
rewrite R; auto. apply preg_of_not_X29; auto.
707+
rewrite R; auto. apply preg_of_not_X15; auto.
708708
Local Transparent destroyed_by_op.
709709
destruct op; try exact I; simpl; congruence.
710710

@@ -933,7 +933,7 @@ Local Transparent destroyed_by_op.
933933
set (tfbody := Pallocframe (fn_stacksize f) (fn_link_ofs f) ::
934934
storeptr RA XSP (fn_retaddr_ofs f) x0) in *.
935935
set (tf := {| fn_sig := Mach.fn_sig f; fn_code := tfbody |}) in *.
936-
set (rs2 := nextinstr (rs0#X29 <- (parent_sp s) #SP <- sp #X16 <- Vundef)).
936+
set (rs2 := nextinstr (rs0#X15 <- (parent_sp s) #SP <- sp #X16 <- Vundef)).
937937
exploit (storeptr_correct tge tf XSP (fn_retaddr_ofs f) RA x0 m2' m3' rs2).
938938
simpl preg_of_iregsp. change (rs2 X30) with (rs0 X30). rewrite ATLR.
939939
change (rs2 X2) with sp. eexact P.

aarch64/Conventions1.v

+3-3
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,7 @@ Definition is_callee_save (r: mreg): bool :=
3838
| R17 => false
3939
| R19 | R20 | R21 | R22 | R23 => true
4040
| R24 | R25 | R26 | R27 | R28 => true
41-
| R29 => false
41+
| R29 => true
4242
| F0 | F1 | F2 | F3 | F4 | F5 | F6 | F7 => false
4343
| F8 | F9 | F10 | F11 | F12 | F13 | F14 | F15 => true
4444
| F16 | F17 | F18 | F19 | F20 | F21 | F22 | F23 => false
@@ -48,7 +48,7 @@ Definition is_callee_save (r: mreg): bool :=
4848
Definition int_caller_save_regs :=
4949
R0 :: R1 :: R2 :: R3 :: R4 :: R5 :: R6 :: R7
5050
:: R8 :: R9 :: R10 :: R11 :: R12 :: R13 :: R14 :: R15
51-
:: R17 :: R29 :: nil.
51+
:: R17 :: nil.
5252

5353
Definition float_caller_save_regs :=
5454
F0 :: F1 :: F2 :: F3 :: F4 :: F5 :: F6 :: F7
@@ -57,7 +57,7 @@ Definition float_caller_save_regs :=
5757

5858
Definition int_callee_save_regs :=
5959
R19 :: R20 :: R21 :: R22 :: R23
60-
:: R24 :: R25 :: R26 :: R27 :: R28 :: nil.
60+
:: R24 :: R25 :: R26 :: R27 :: R28 :: R29 :: nil.
6161

6262
Definition float_callee_save_regs :=
6363
F8 :: F9 :: F10 :: F11 :: F12 :: F13 :: F14 :: F15 :: nil.

aarch64/Machregs.v

+3-3
Original file line numberDiff line numberDiff line change
@@ -156,18 +156,18 @@ Fixpoint destroyed_by_clobber (cl: list string): list mreg :=
156156

157157
Definition destroyed_by_builtin (ef: external_function): list mreg :=
158158
match ef with
159-
| EF_memcpy sz al => R15 :: R17 :: R29 :: nil
159+
| EF_memcpy sz al => R14 :: R15 :: R17 :: nil
160160
| EF_inline_asm txt sg clob => destroyed_by_clobber clob
161161
| _ => nil
162162
end.
163163

164164
Definition destroyed_by_setstack (ty: typ): list mreg := nil.
165165

166-
Definition destroyed_at_function_entry: list mreg := R29 :: nil.
166+
Definition destroyed_at_function_entry: list mreg := R15 :: nil.
167167

168168
Definition destroyed_at_indirect_call: list mreg := nil.
169169

170-
Definition temp_for_parent_frame: mreg := R29.
170+
Definition temp_for_parent_frame: mreg := R15.
171171

172172
Definition mregs_for_operation (op: operation): list (option mreg) * option mreg :=
173173
(nil, None).

0 commit comments

Comments
 (0)