Skip to content

Commit 0398d2e

Browse files
committed
[BOLT] Gadget scanner: detect signing oracles
Implement the detection of signing oracles. In this patch, a signing oracle is defined as a sign instruction that accepts a "non-protected" pointer, but for a slightly different definition of "non-protected" compared to control flow instructions.

A second BitVector named TrustedRegs is added to the register state computed by the data-flow analysis. The difference between the "safe-to-dereference" and "trusted" register states is that to make an unsafe register trusted by authentication, one has to make sure that the authentication succeeded. For example, on AArch64 without FEAT_PAuth2 and FEAT_EPAC, an authentication instruction produces an invalid pointer on failure, so that a subsequent memory access triggers an error, but re-signing such a pointer would "fix" the signature.

Note that while a separate "trusted" register state may be redundant depending on the specific semantics of auth and sign operations, it is still important to check signing operations: while code like this

    resign:
      autda x0, x1
      pacda x0, x2
      ret

is probably safe provided `autda` generates an error on authentication failure, this function

    sign_anything:
      pacda x0, x1
      ret

is inherently unsafe.
1 parent 168488e commit 0398d2e

File tree

8 files changed

+2166
-125
lines changed

8 files changed

+2166
-125
lines changed

bolt/include/bolt/Core/MCPlusBuilder.h

+44
Original file line number | Diff line number | Diff line change
@@ -49,6 +49,7 @@ class MCSymbol;
4949
class raw_ostream;
5050

5151
namespace bolt {
52+
class BinaryBasicBlock;
5253
class BinaryFunction;
5354

5455
/// Different types of indirect branches encountered during disassembly.
@@ -572,6 +573,11 @@ class MCPlusBuilder {
572573
return false;
573574
}
574575

576+
virtual MCPhysReg getSignedReg(const MCInst &Inst) const {
577+
llvm_unreachable("not implemented");
578+
return getNoRegister();
579+
}
580+
575581
virtual ErrorOr<MCPhysReg> getRegUsedAsRetDest(const MCInst &Inst) const {
576582
llvm_unreachable("not implemented");
577583
return getNoRegister();
@@ -622,6 +628,44 @@ class MCPlusBuilder {
622628
return std::make_pair(getNoRegister(), getNoRegister());
623629
}
624630

631+
/// Analyzes if a pointer is checked to be authenticated successfully
632+
/// by the end of the basic block.
633+
///
634+
/// It is possible for pointer authentication instructions not to terminate
635+
/// the program abnormally on authentication failure and return some invalid
636+
/// pointer instead (like it is done on AArch64 when FEAT_FPAC is not
637+
/// implemented). This might be enough to crash on invalid memory access when
638+
/// the pointer is later used as the destination of a load, store, or branch
639+
/// instruction. On the other hand, when the pointer is not used right away,
640+
/// it may be important for the compiler to check the address explicitly not
641+
/// to introduce a signing or authentication oracle.
642+
///
643+
/// If this function returns a (Reg, Inst) pair and before execution of Inst
644+
/// Reg was last written to by an authentication instruction, then it is known
645+
/// that in any successor of BB either
646+
/// * the authentication instruction that last wrote to Reg succeeded, or
647+
/// * the program is terminated abnormally without introducing any signing
648+
/// or authentication oracles
649+
virtual std::optional<std::pair<MCPhysReg, MCInst *>>
650+
getAuthCheckedReg(BinaryBasicBlock &BB) const {
651+
llvm_unreachable("not implemented");
652+
return std::nullopt;
653+
}
654+
655+
/// Returns the register that is checked to be authenticated successfully.
656+
///
657+
/// If the returned register was last written to by an authentication
658+
/// instruction and that authentication failed, then the program is known
659+
/// to be terminated abnormally as a result of execution of Inst.
660+
///
661+
/// Additionally, if MayOverwrite is false, it is known that the authenticated
662+
/// pointer is not clobbered by Inst itself.
663+
virtual MCPhysReg getAuthCheckedReg(const MCInst &Inst,
664+
bool MayOverwrite) const {
665+
llvm_unreachable("not implemented");
666+
return getNoRegister();
667+
}
668+
625669
virtual bool isTerminator(const MCInst &Inst) const;
626670

627671
virtual bool isNoop(const MCInst &Inst) const {

bolt/lib/Passes/PAuthGadgetScanner.cpp

+147-8
Original file line number | Diff line number | Diff line change
@@ -173,10 +173,24 @@ class TrackedRegisters {
173173
/// X30 is safe-to-dereference - the state computed for sub- and
174174
/// super-registers is not inspected.
175175
struct SrcState {
176-
/// A BitVector containing the registers that are either safe at function
177-
/// entry and were not clobbered yet, or those not clobbered since being
178-
/// authenticated.
176+
/// A BitVector containing the registers that are either authenticated
177+
/// (assuming failed authentication is permitted to produce an invalid
178+
/// address, provided it generates an error on memory access) or whose
179+
/// value is known not to be attacker-controlled under Pointer Authentication
180+
/// threat model. The registers in this set are either
181+
/// * not clobbered since being authenticated, or
182+
/// * trusted at function entry and were not clobbered yet, or
183+
/// * contain a safely materialized address.
179184
BitVector SafeToDerefRegs;
185+
/// A BitVector containing the registers that are either authenticated
186+
/// *successfully* or whose value is known not to be attacker-controlled
187+
/// under Pointer Authentication threat model.
188+
/// The registers in this set are either
189+
/// * authenticated and then checked to be authenticated successfully
190+
/// (and not clobbered since then), or
191+
/// * trusted at function entry and were not clobbered yet, or
192+
/// * contain a safely materialized address.
193+
BitVector TrustedRegs;
180194
/// A vector of sets, only used in the second data flow run.
181195
/// Each element in the vector represents one of the registers for which we
182196
/// track the set of last instructions that wrote to this register. For
@@ -189,7 +203,8 @@ struct SrcState {
189203
SrcState() {}
190204

191205
SrcState(unsigned NumRegs, unsigned NumRegsToTrack)
192-
: SafeToDerefRegs(NumRegs), LastInstWritingReg(NumRegsToTrack) {}
206+
: SafeToDerefRegs(NumRegs), TrustedRegs(NumRegs),
207+
LastInstWritingReg(NumRegsToTrack) {}
193208

194209
SrcState &merge(const SrcState &StateIn) {
195210
if (StateIn.empty())
@@ -198,6 +213,7 @@ struct SrcState {
198213
return (*this = StateIn);
199214

200215
SafeToDerefRegs &= StateIn.SafeToDerefRegs;
216+
TrustedRegs &= StateIn.TrustedRegs;
201217
for (unsigned I = 0; I < LastInstWritingReg.size(); ++I)
202218
for (const MCInst *J : StateIn.LastInstWritingReg[I])
203219
LastInstWritingReg[I].insert(J);
@@ -210,6 +226,7 @@ struct SrcState {
210226

211227
bool operator==(const SrcState &RHS) const {
212228
return SafeToDerefRegs == RHS.SafeToDerefRegs &&
229+
TrustedRegs == RHS.TrustedRegs &&
213230
LastInstWritingReg == RHS.LastInstWritingReg;
214231
}
215232
bool operator!=(const SrcState &RHS) const { return !((*this) == RHS); }
@@ -234,6 +251,7 @@ raw_ostream &operator<<(raw_ostream &OS, const SrcState &S) {
234251
OS << "empty";
235252
} else {
236253
OS << "SafeToDerefRegs: " << S.SafeToDerefRegs << ", ";
254+
OS << "TrustedRegs: " << S.TrustedRegs << ", ";
237255
printLastInsts(OS, S.LastInstWritingReg);
238256
}
239257
OS << ">";
@@ -254,18 +272,22 @@ void SrcStatePrinter::print(raw_ostream &OS, const SrcState &S) const {
254272
OS << "src-state<";
255273
if (S.empty()) {
256274
assert(S.SafeToDerefRegs.empty());
275+
assert(S.TrustedRegs.empty());
257276
assert(S.LastInstWritingReg.empty());
258277
OS << "empty";
259278
} else {
260279
OS << "SafeToDerefRegs: ";
261280
RegStatePrinter.print(OS, S.SafeToDerefRegs);
281+
OS << ", TrustedRegs: ";
282+
RegStatePrinter.print(OS, S.TrustedRegs);
262283
OS << ", ";
263284
printLastInsts(OS, S.LastInstWritingReg);
264285
}
265286
OS << ">";
266287
}
267288

268-
/// Computes which registers are safe to be used by control flow instructions.
289+
/// Computes which registers are safe to be used by control flow and signing
290+
/// instructions.
269291
///
270292
/// This is the base class for two implementations: a dataflow-based analysis
271293
/// which is intended to be used for most functions and a simplified CFG-unaware
@@ -293,6 +315,17 @@ class SrcSafetyAnalysis {
293315
/// RegsToTrackInstsFor is the set of registers for which the dataflow analysis
294316
/// must compute the set of last instructions writing to each of them.
295317
const TrackedRegisters RegsToTrackInstsFor;
318+
/// Stores information about the detected instruction sequences emitted to
319+
/// check an authenticated pointer. Specifically, if such a sequence is detected
320+
/// in a basic block, it maps the last instruction of that basic block to
321+
/// (CheckedRegister, FirstInstOfTheSequence) pair, see the description of
322+
/// MCPlusBuilder::getAuthCheckedReg(BB) method.
323+
///
324+
/// As the detection of such sequences requires iterating over the adjacent
325+
/// instructions, it should be done before calling computeNext(), which
326+
/// operates on separate instructions.
327+
DenseMap<const MCInst *, std::pair<MCPhysReg, const MCInst *>>
328+
CheckerSequenceInfo;
296329

297330
SmallPtrSet<const MCInst *, 4> &lastWritingInsts(SrcState &S,
298331
MCPhysReg Reg) const {
@@ -307,8 +340,10 @@ class SrcSafetyAnalysis {
307340

308341
SrcState createEntryState() {
309342
SrcState S(NumRegs, RegsToTrackInstsFor.getNumTrackedRegisters());
310-
for (MCPhysReg Reg : BC.MIB->getTrustedLiveInRegs())
311-
S.SafeToDerefRegs |= BC.MIB->getAliases(Reg, /*OnlySmaller=*/true);
343+
for (MCPhysReg Reg : BC.MIB->getTrustedLiveInRegs()) {
344+
S.TrustedRegs |= BC.MIB->getAliases(Reg, /*OnlySmaller=*/true);
345+
S.SafeToDerefRegs = S.TrustedRegs;
346+
}
312347
return S;
313348
}
314349

@@ -355,6 +390,46 @@ class SrcSafetyAnalysis {
355390
return Regs;
356391
}
357392

393+
// Returns all registers made trusted by this instruction.
394+
SmallVector<MCPhysReg> getRegsMadeTrusted(const MCInst &Point,
395+
const SrcState &Cur) const {
396+
SmallVector<MCPhysReg> Regs;
397+
const MCPhysReg NoReg = BC.MIB->getNoRegister();
398+
399+
// An authenticated pointer can be checked, or
400+
MCPhysReg CheckedReg =
401+
BC.MIB->getAuthCheckedReg(Point, /*MayOverwrite=*/false);
402+
if (CheckedReg != NoReg && Cur.SafeToDerefRegs[CheckedReg])
403+
Regs.push_back(CheckedReg);
404+
405+
if (CheckerSequenceInfo.contains(&Point)) {
406+
MCPhysReg CheckedReg;
407+
const MCInst *FirstCheckerInst;
408+
std::tie(CheckedReg, FirstCheckerInst) = CheckerSequenceInfo.at(&Point);
409+
410+
// FirstCheckerInst should belong to the same basic block, meaning
411+
// it was deterministically processed a few steps before this instruction.
412+
const SrcState &StateBeforeChecker =
413+
getStateBefore(*FirstCheckerInst).get();
414+
if (StateBeforeChecker.SafeToDerefRegs[CheckedReg])
415+
Regs.push_back(CheckedReg);
416+
}
417+
418+
// ... a safe address can be materialized, or
419+
MCPhysReg NewAddrReg = BC.MIB->getMaterializedAddressRegForPtrAuth(Point);
420+
if (NewAddrReg != NoReg)
421+
Regs.push_back(NewAddrReg);
422+
423+
// ... an address can be updated in a safe manner, producing the result
424+
// which is as trusted as the input address.
425+
if (auto DstAndSrc = BC.MIB->analyzeAddressArithmeticsForPtrAuth(Point)) {
426+
if (Cur.TrustedRegs[DstAndSrc->second])
427+
Regs.push_back(DstAndSrc->first);
428+
}
429+
430+
return Regs;
431+
}
432+
358433
SrcState computeNext(const MCInst &Point, const SrcState &Cur) {
359434
SrcStatePrinter P(BC);
360435
LLVM_DEBUG({
@@ -381,11 +456,34 @@ class SrcSafetyAnalysis {
381456
BitVector Clobbered = getClobberedRegs(Point);
382457
SmallVector<MCPhysReg> NewSafeToDerefRegs =
383458
getRegsMadeSafeToDeref(Point, Cur);
459+
SmallVector<MCPhysReg> NewTrustedRegs = getRegsMadeTrusted(Point, Cur);
460+
461+
// Ideally, being trusted is a strictly stronger property than being
462+
// safe-to-dereference. To simplify the computation of Next state, enforce
463+
// this for NewSafeToDerefRegs and NewTrustedRegs. Additionally, this
464+
// fixes the property for "cumulative" register states in tricky cases
465+
// like the following:
466+
//
467+
// ; LR is safe to dereference here
468+
// mov x16, x30 ; start of the sequence, LR is s-t-d right before
469+
// xpaclri ; clobbers LR, LR is not safe anymore
470+
// cmp x30, x16
471+
// b.eq 1f ; end of the sequence: LR is marked as trusted
472+
// brk 0x1234
473+
// 1:
474+
// ; at this point LR would be marked as trusted,
475+
// ; but not safe-to-dereference
476+
//
477+
for (auto TrustedReg : NewTrustedRegs) {
478+
if (!is_contained(NewSafeToDerefRegs, TrustedReg))
479+
NewSafeToDerefRegs.push_back(TrustedReg);
480+
}
384481

385482
// Then, compute the state after this instruction is executed.
386483
SrcState Next = Cur;
387484

388485
Next.SafeToDerefRegs.reset(Clobbered);
486+
Next.TrustedRegs.reset(Clobbered);
389487
// Keep track of this instruction if it writes to any of the registers we
390488
// need to track that for:
391489
for (MCPhysReg Reg : RegsToTrackInstsFor.getRegisters())
@@ -406,6 +504,10 @@ class SrcSafetyAnalysis {
406504
lastWritingInsts(Next, Reg).clear();
407505
}
408506

507+
// Process new trusted registers.
508+
for (MCPhysReg TrustedReg : NewTrustedRegs)
509+
Next.TrustedRegs |= BC.MIB->getAliases(TrustedReg, /*OnlySmaller=*/true);
510+
409511
LLVM_DEBUG({
410512
dbgs() << " .. result: (";
411513
P.print(dbgs(), Next);
@@ -462,7 +564,22 @@ class DataflowSrcSafetyAnalysis
462564
return DFParent::getStateBefore(Inst);
463565
}
464566

465-
void run() override { DFParent::run(); }
567+
void run() override {
568+
for (BinaryBasicBlock &BB : Func) {
569+
if (auto CheckerInfo = BC.MIB->getAuthCheckedReg(BB)) {
570+
MCInst *LastInstOfChecker = BB.getLastNonPseudoInstr();
571+
LLVM_DEBUG({
572+
dbgs() << "Found pointer checking sequence in " << BB.getName()
573+
<< ":\n";
574+
traceReg(BC, "Checked register", CheckerInfo->first);
575+
traceInst(BC, "First instruction", *CheckerInfo->second);
576+
traceInst(BC, "Last instruction", *LastInstOfChecker);
577+
});
578+
CheckerSequenceInfo[LastInstOfChecker] = *CheckerInfo;
579+
}
580+
}
581+
DFParent::run();
582+
}
466583

467584
protected:
468585
void preflight() {}
@@ -658,6 +775,26 @@ shouldReportCallGadget(const BinaryContext &BC, const MCInstReference &Inst,
658775
return std::make_shared<GadgetReport>(CallKind, Inst, DestReg);
659776
}
660777

778+
static std::shared_ptr<Report>
779+
shouldReportSigningOracle(const BinaryContext &BC, const MCInstReference &Inst,
780+
const SrcState &S) {
781+
static const GadgetKind SigningOracleKind("signing oracle found");
782+
783+
MCPhysReg SignedReg = BC.MIB->getSignedReg(Inst);
784+
if (SignedReg == BC.MIB->getNoRegister())
785+
return nullptr;
786+
787+
LLVM_DEBUG({
788+
traceInst(BC, "Found sign inst", Inst);
789+
traceReg(BC, "Signed reg", SignedReg);
790+
traceRegMask(BC, "TrustedRegs", S.TrustedRegs);
791+
});
792+
if (S.TrustedRegs[SignedReg])
793+
return nullptr;
794+
795+
return std::make_shared<GadgetReport>(SigningOracleKind, Inst, SignedReg);
796+
}
797+
661798
template <typename T> static void iterateOverInstrs(BinaryFunction &BF, T Fn) {
662799
if (BF.hasCFG()) {
663800
for (BinaryBasicBlock &BB : BF)
@@ -702,6 +839,8 @@ Analysis::findGadgets(BinaryFunction &BF,
702839

703840
if (auto Report = shouldReportCallGadget(BC, Inst, S))
704841
Result.Diagnostics.push_back(Report);
842+
if (auto Report = shouldReportSigningOracle(BC, Inst, S))
843+
Result.Diagnostics.push_back(Report);
705844
});
706845
return Result;
707846
}

0 commit comments

Comments
 (0)