[libc++abi] Fix possible infinite loop in itanium demangler
A libfuzzer run has discovered some inputs for which the demangler does not terminate. When minimized, it looks like this: _Zcv1BIRT_EIS1_E Deciphered: _Z cv - conversion operator * result type 1B - "B" I - template args begin R - reference type <. T_ - forward template reference | * E - template args end | | | | * parameter type | | I - template args begin | | S1_ - substitution #1 * <' E - template args end The reason is: template-parameter refs in conversion operator result type create forward-references, while substitutions are instantly resolved via back-references. Together these can create a reference loop. It causes an infinite loop in ReferenceType::collapse(). I see three possible ways to avoid these loops: 1. check if resolving a forward reference creates a loop and reject the invalid input (hard to traverse AST at this point) 2. check if a substitution contains a malicious forward reference and reject the invalid input (hard to traverse AST at this point; substitutions are quite common: may affect performance; hard to clearly detect loops at this point) 3. detect loops in ReferenceType::collapse() (cannot reject the input) This patch implements (3) as seemingly the least-impact change. As a side effect, such invalid input strings are not rejected and produce garbage, however there are already similar guards in `if (Printing) return;` checks. Fixes https://llvm.org/PR51407 Differential Revision: https://reviews.llvm.org/D107712
This commit is contained in:
parent
db7c68d808
commit
f0fcd42495
|
@ -651,8 +651,15 @@ class ReferenceType : public Node {
|
|||
// Dig through any refs to refs, collapsing the ReferenceTypes as we go. The
|
||||
// rule here is rvalue ref to rvalue ref collapses to a rvalue ref, and any
|
||||
// other combination collapses to a lvalue ref.
|
||||
//
|
||||
// A combination of a TemplateForwardReference and a back-ref Substitution
|
||||
// from an ill-formed string may have created a cycle; use cycle detection to
|
||||
// avoid looping forever.
|
||||
std::pair<ReferenceKind, const Node *> collapse(OutputStream &S) const {
|
||||
auto SoFar = std::make_pair(RK, Pointee);
|
||||
// Track the chain of nodes for the Floyd's 'tortoise and hare'
|
||||
// cycle-detection algorithm, since getSyntaxNode(S) is impure
|
||||
PODSmallVector<const Node *, 8> Prev;
|
||||
for (;;) {
|
||||
const Node *SN = SoFar.second->getSyntaxNode(S);
|
||||
if (SN->getKind() != KReferenceType)
|
||||
|
@ -660,6 +667,14 @@ class ReferenceType : public Node {
|
|||
auto *RT = static_cast<const ReferenceType *>(SN);
|
||||
SoFar.second = RT->Pointee;
|
||||
SoFar.first = std::min(SoFar.first, RT->RK);
|
||||
|
||||
// The middle of Prev is the 'slow' pointer moving at half speed
|
||||
Prev.push_back(SoFar.second);
|
||||
if (Prev.size() > 1 && SoFar.second == Prev[(Prev.size() - 1) / 2]) {
|
||||
// Cycle detected
|
||||
SoFar.second = nullptr;
|
||||
break;
|
||||
}
|
||||
}
|
||||
return SoFar;
|
||||
}
|
||||
|
@ -680,6 +695,8 @@ public:
|
|||
return;
|
||||
SwapAndRestore<bool> SavePrinting(Printing, true);
|
||||
std::pair<ReferenceKind, const Node *> Collapsed = collapse(s);
|
||||
if (!Collapsed.second)
|
||||
return;
|
||||
Collapsed.second->printLeft(s);
|
||||
if (Collapsed.second->hasArray(s))
|
||||
s += " ";
|
||||
|
@ -693,6 +710,8 @@ public:
|
|||
return;
|
||||
SwapAndRestore<bool> SavePrinting(Printing, true);
|
||||
std::pair<ReferenceKind, const Node *> Collapsed = collapse(s);
|
||||
if (!Collapsed.second)
|
||||
return;
|
||||
if (Collapsed.second->hasArray(s) || Collapsed.second->hasFunction(s))
|
||||
s += ")";
|
||||
Collapsed.second->printRight(s);
|
||||
|
|
|
@ -9,6 +9,11 @@
|
|||
// The demangler does not pass all these tests with the system dylibs on macOS.
|
||||
// XFAIL: use_system_cxx_lib && target={{.+}}-apple-macosx10.{{9|10|11|12|13|14|15}}
|
||||
|
||||
// https://llvm.org/PR51407 was not fixed in some previously-released
|
||||
// demanglers, which causes them to run into the infinite loop.
|
||||
// UNSUPPORTED: use_system_cxx_lib && target={{.+}}-apple-macosx10.{{9|10|11|12|13|14|15}}
|
||||
// UNSUPPORTED: use_system_cxx_lib && target={{.+}}-apple-macosx11.0
|
||||
|
||||
#include "support/timer.h"
|
||||
#include <cassert>
|
||||
#include <cstdio>
|
||||
|
@ -29844,6 +29849,9 @@ const char* cases[][2] =
|
|||
|
||||
{"_ZN3xxx3yyyIvNS_1AILm0EEEZNS_2bb2cc2ddILNS_1eE1EEEvRKNS_1fERKNS_1g1hINS_1iEEERKNS_1jEfRKNS_1kEiPhEUlvE_JEEEvT1_DpT2_", "void xxx::yyy<void, xxx::A<0ul>, void xxx::bb::cc::dd<(xxx::e)1>(xxx::f const&, xxx::g::h<xxx::i> const&, xxx::j const&, float, xxx::k const&, int, unsigned char*)::'lambda'()>(void xxx::bb::cc::dd<(xxx::e)1>(xxx::f const&, xxx::g::h<xxx::i> const&, xxx::j const&, float, xxx::k const&, int, unsigned char*)::'lambda'())"},
|
||||
|
||||
// This should be invalid, but it is currently not recognized as such
|
||||
// See https://llvm.org/PR51407
|
||||
{"_Zcv1BIRT_EIS1_E", "operator B<><>"},
|
||||
};
|
||||
|
||||
const unsigned N = sizeof(cases) / sizeof(cases[0]);
|
||||
|
|
|
@ -651,8 +651,15 @@ class ReferenceType : public Node {
|
|||
// Dig through any refs to refs, collapsing the ReferenceTypes as we go. The
|
||||
// rule here is rvalue ref to rvalue ref collapses to a rvalue ref, and any
|
||||
// other combination collapses to a lvalue ref.
|
||||
//
|
||||
// A combination of a TemplateForwardReference and a back-ref Substitution
|
||||
// from an ill-formed string may have created a cycle; use cycle detection to
|
||||
// avoid looping forever.
|
||||
std::pair<ReferenceKind, const Node *> collapse(OutputStream &S) const {
|
||||
auto SoFar = std::make_pair(RK, Pointee);
|
||||
// Track the chain of nodes for the Floyd's 'tortoise and hare'
|
||||
// cycle-detection algorithm, since getSyntaxNode(S) is impure
|
||||
PODSmallVector<const Node *, 8> Prev;
|
||||
for (;;) {
|
||||
const Node *SN = SoFar.second->getSyntaxNode(S);
|
||||
if (SN->getKind() != KReferenceType)
|
||||
|
@ -660,6 +667,14 @@ class ReferenceType : public Node {
|
|||
auto *RT = static_cast<const ReferenceType *>(SN);
|
||||
SoFar.second = RT->Pointee;
|
||||
SoFar.first = std::min(SoFar.first, RT->RK);
|
||||
|
||||
// The middle of `Prev` is the 'slow' pointer moving at half speed
|
||||
Prev.push_back(SoFar.second);
|
||||
if (Prev.size() > 1 && SoFar.second == Prev[(Prev.size() - 1) / 2]) {
|
||||
// Cycle detected
|
||||
SoFar.second = nullptr;
|
||||
break;
|
||||
}
|
||||
}
|
||||
return SoFar;
|
||||
}
|
||||
|
@ -680,6 +695,8 @@ public:
|
|||
return;
|
||||
SwapAndRestore<bool> SavePrinting(Printing, true);
|
||||
std::pair<ReferenceKind, const Node *> Collapsed = collapse(s);
|
||||
if (!Collapsed.second)
|
||||
return;
|
||||
Collapsed.second->printLeft(s);
|
||||
if (Collapsed.second->hasArray(s))
|
||||
s += " ";
|
||||
|
@ -693,6 +710,8 @@ public:
|
|||
return;
|
||||
SwapAndRestore<bool> SavePrinting(Printing, true);
|
||||
std::pair<ReferenceKind, const Node *> Collapsed = collapse(s);
|
||||
if (!Collapsed.second)
|
||||
return;
|
||||
if (Collapsed.second->hasArray(s) || Collapsed.second->hasFunction(s))
|
||||
s += ")";
|
||||
Collapsed.second->printRight(s);
|
||||
|
|
Loading…
Reference in New Issue