From eb5fc6cd37d115916e6f2d09ae49084c5eeef3b1 Mon Sep 17 00:00:00 2001 From: Szymon Tomasz Stefanek Date: Sat, 26 May 2018 03:01:11 +0200 Subject: [PATCH 1/2] CXX: Fix #1750 (without breaking other unit tests) --- .../expected.tags | 2 - .../args.ctags | 0 .../expected.tags | 2 + .../input.hpp | 0 parsers/cxx/cxx_parser_template.c | 176 ++++++++++++++---- 5 files changed, 143 insertions(+), 37 deletions(-) delete mode 100644 Units/parser-cxx.r/template-nested-triangle-brackets.b/expected.tags rename Units/parser-cxx.r/{template-nested-triangle-brackets.b => template-nested-triangle-brackets.d}/args.ctags (100%) create mode 100644 Units/parser-cxx.r/template-nested-triangle-brackets.d/expected.tags rename Units/parser-cxx.r/{template-nested-triangle-brackets.b => template-nested-triangle-brackets.d}/input.hpp (100%) diff --git a/Units/parser-cxx.r/template-nested-triangle-brackets.b/expected.tags b/Units/parser-cxx.r/template-nested-triangle-brackets.b/expected.tags deleted file mode 100644 index e5499e69e6..0000000000 --- a/Units/parser-cxx.r/template-nested-triangle-brackets.b/expected.tags +++ /dev/null @@ -1,2 +0,0 @@ -Test input.hpp /^class Test : public set {$/;" c template:template:,class _Comp1=less>> -xxx input.hpp /^ typedef int xxx;$/;" t class:Test typeref:typename:int diff --git a/Units/parser-cxx.r/template-nested-triangle-brackets.b/args.ctags b/Units/parser-cxx.r/template-nested-triangle-brackets.d/args.ctags similarity index 100% rename from Units/parser-cxx.r/template-nested-triangle-brackets.b/args.ctags rename to Units/parser-cxx.r/template-nested-triangle-brackets.d/args.ctags diff --git a/Units/parser-cxx.r/template-nested-triangle-brackets.d/expected.tags b/Units/parser-cxx.r/template-nested-triangle-brackets.d/expected.tags new file mode 100644 index 0000000000..b11ce65350 --- /dev/null +++ b/Units/parser-cxx.r/template-nested-triangle-brackets.d/expected.tags @@ -0,0 +1,2 @@ +Test input.hpp /^class Test : public set {$/;" c template:,class _Comp1=less>> +xxx input.hpp /^ typedef int xxx;$/;" t class:Test typeref:typename:int diff --git a/Units/parser-cxx.r/template-nested-triangle-brackets.b/input.hpp b/Units/parser-cxx.r/template-nested-triangle-brackets.d/input.hpp similarity index 100% rename from Units/parser-cxx.r/template-nested-triangle-brackets.b/input.hpp rename to Units/parser-cxx.r/template-nested-triangle-brackets.d/input.hpp diff --git a/parsers/cxx/cxx_parser_template.c b/parsers/cxx/cxx_parser_template.c index 16b40951b9..64f0a1c7a5 100644 --- a/parsers/cxx/cxx_parser_template.c +++ b/parsers/cxx/cxx_parser_template.c @@ -24,12 +24,25 @@ #include +typedef enum _CXXParserParseTemplateAngleBracketsResult +{ + // Succeeded parsing the template angle bracket, everything looks fine + CXXParserParseTemplateAngleBracketsSucceeded, + // Succeeded, but the parsing was unbalanced and was terminated by an 'unexpected' condition + // that detected the end of the template. If this is function has been called + // from an upper template parsing level, the caller should exit too. + CXXParserParseTemplateAngleBracketsFinishedPrematurely, + // Failed miserably, continuing parsing is not possible + CXXParserParseTemplateAngleBracketsFailed, + // Failed miserably, but it may be possible to continue parsing + CXXParserParseTemplateAngleBracketsFailedRecoverable +} CXXParserParseTemplateAngleBracketsResult; // // Parses the part of a template specification. // Here we are pointing at the initial <. // -static bool cxxParserParseTemplateAngleBrackets(void) +static CXXParserParseTemplateAngleBracketsResult cxxParserParseTemplateAngleBracketsInternal(void) { CXX_DEBUG_ENTER(); @@ -65,14 +78,14 @@ static bool cxxParserParseTemplateAngleBrackets(void) if(!cxxParserParseAndCondenseSubchainsUpToOneOf( CXXTokenTypeGreaterThanSign | CXXTokenTypeSmallerThanSign | CXXTokenTypeOpeningBracket | CXXTokenTypeSemicolon | - CXXTokenTypeEOF | CXXTokenTypeAssignment, + CXXTokenTypeEOF | CXXTokenTypeKeyword, CXXTokenTypeOpeningParenthesis | CXXTokenTypeOpeningSquareParenthesis, false )) { CXX_DEBUG_LEAVE_TEXT("Failed to parse up to '<>{EOF'"); - return false; + return CXXParserParseTemplateAngleBracketsFailed; } evaluate_current_token: @@ -90,7 +103,7 @@ static bool cxxParserParseTemplateAngleBrackets(void) if(!cxxParserParseNextToken()) { CXX_DEBUG_LEAVE_TEXT("Syntax error, but tolerate it at this level"); - return true; + return CXXParserParseTemplateAngleBracketsFailedRecoverable; } CXX_DEBUG_PRINT( @@ -123,14 +136,15 @@ static bool cxxParserParseTemplateAngleBrackets(void) )) { CXX_DEBUG_LEAVE_TEXT("Failed to condense current subchain"); - return true; + return CXXParserParseTemplateAngleBracketsFailed; } + if(cxxTokenTypeIs(g_cxx.pToken,CXXTokenTypeEOF)) { CXX_DEBUG_LEAVE_TEXT( "Found EOF, syntax error but we tolerate it" ); - return true; + return CXXParserParseTemplateAngleBracketsFailedRecoverable; } } else { // it's ok @@ -143,18 +157,22 @@ static bool cxxParserParseTemplateAngleBrackets(void) } break; case CXXTokenTypeGreaterThanSign: + { if(iTemplateLevel == 0) { // Non-nested > : always a terminator CXX_DEBUG_LEAVE_TEXT("Found end of template"); - return true; + return CXXParserParseTemplateAngleBracketsSucceeded; } - // Nested > : is it a shift operator? + + // Nested > : is is a shift operator? + + bool bFollowedBySpace = g_cxx.pToken->bFollowedBySpace; if(!cxxParserParseNextToken()) { CXX_DEBUG_LEAVE_TEXT("Syntax error, but tolerate it at this level"); - return true; + return CXXParserParseTemplateAngleBracketsFailedRecoverable; } CXX_DEBUG_PRINT( @@ -163,7 +181,9 @@ static bool cxxParserParseTemplateAngleBrackets(void) g_cxx.pToken->eType ); - if(cxxTokenTypeIs(g_cxx.pToken,CXXTokenTypeGreaterThanSign)) + bool bIsGreaterThan = cxxTokenTypeIs(g_cxx.pToken,CXXTokenTypeGreaterThanSign); + + if((!bFollowedBySpace) && bIsGreaterThan) { // assume it's an operator CXX_DEBUG_PRINT("Treating > as shift-right operator"); @@ -171,6 +191,32 @@ static bool cxxParserParseTemplateAngleBrackets(void) CXX_DEBUG_PRINT("Decreasing template level"); iTemplateLevel--; + if(bIsGreaterThan) + goto evaluate_current_token; + + // Handle gracefully some cases + if( + cxxTokenTypeIs(g_cxx.pToken,CXXTokenTypeKeyword) && + (!cxxKeywordIsConstant(g_cxx.pToken->eKeyword)) + ) + { + // We found something like + // ... > void ... + // ... > static ... + // The part on the right of > does not seem to be a constant + // so this is not a comparison. Most likely explaination: + // We screwed up the parsing of the template. + // However we can still attempt to emit a symbol here. + CXX_DEBUG_PRINT( + "Found '> %s': assuming end of template", + vStringValue(g_cxx.pToken->pszWord) + ); + + cxxParserUngetCurrentToken(); + CXX_DEBUG_LEAVE_TEXT("Found (broken) end of template"); + return CXXParserParseTemplateAngleBracketsFinishedPrematurely; + } + if(cxxTokenTypeIsOneOf( g_cxx.pToken, CXXTokenTypeOpeningParenthesis | @@ -187,45 +233,79 @@ static bool cxxParserParseTemplateAngleBrackets(void) )) { CXX_DEBUG_LEAVE_TEXT("Failed to condense current subchain"); - return true; + return CXXParserParseTemplateAngleBracketsFailed; } + if(cxxTokenTypeIs(g_cxx.pToken,CXXTokenTypeEOF)) { CXX_DEBUG_LEAVE_TEXT("Found EOF, syntax error but we tolerate it"); - return true; + return CXXParserParseTemplateAngleBracketsFailedRecoverable; } } else { // it's ok CXX_DEBUG_PRINT("No need to condense subchain"); } } + } break; - case CXXTokenTypeComma: - case CXXTokenTypeAssignment: - CXX_DEBUG_PRINT("Found assignment, trying to skip up to a 'notable' point"); - // try to skip to the next > or , without stopping at < characters. - if(!cxxParserParseUpToOneOf( - CXXTokenTypeGreaterThanSign | CXXTokenTypeComma | - CXXTokenTypeOpeningBracket | CXXTokenTypeSemicolon | - CXXTokenTypeEOF, - false - )) + case CXXTokenTypeKeyword: + if(cxxTokenIsKeyword(g_cxx.pToken,CXXKeywordTEMPLATE)) { - CXX_DEBUG_LEAVE_TEXT("Failed to parse up to '}EOF'"); - return false; + CXX_DEBUG_PRINT("Found nested template keyword"); + + // nested nastiness. + if(!cxxParserParseNextToken()) + { + CXX_DEBUG_LEAVE_TEXT("Syntax error, but tolerate it at this level"); + return CXXParserParseTemplateAngleBracketsFailedRecoverable; + } + + if(!cxxTokenTypeIs(g_cxx.pToken,CXXTokenTypeSmallerThanSign)) + { + // aaargh... + CXX_DEBUG_PRINT( + "Found unexpected token '%s' of type 0x%02x", + vStringValue(g_cxx.pToken->pszWord), + g_cxx.pToken->eType + ); + + CXX_DEBUG_LEAVE_TEXT("No smaller than sign after template keyword"); + return CXXParserParseTemplateAngleBracketsFailed; + } + + switch(cxxParserParseTemplateAngleBracketsInternal()) + { + case CXXParserParseTemplateAngleBracketsFailed: + CXX_DEBUG_LEAVE_TEXT("Nested template parsing failed"); + return CXXParserParseTemplateAngleBracketsFailed; + break; + case CXXParserParseTemplateAngleBracketsFailedRecoverable: + CXX_DEBUG_LEAVE_TEXT("Nested template parsing recovered"); + return CXXParserParseTemplateAngleBracketsFailedRecoverable; + break; + case CXXParserParseTemplateAngleBracketsFinishedPrematurely: + CXX_DEBUG_LEAVE_TEXT("Nested template finished prematurely"); + return CXXParserParseTemplateAngleBracketsFinishedPrematurely; + break; + case CXXParserParseTemplateAngleBracketsSucceeded: + // ok + CXX_DEBUG_PRINT("Nested template parsing succeeded"); + break; + default: + CXX_DEBUG_ASSERT(false,"Should never end up here"); + return CXXParserParseTemplateAngleBracketsFailed; + break; + } } - if(!cxxTokenTypeIs(g_cxx.pToken,CXXTokenTypeComma)) - goto evaluate_current_token; // backward jump to re-evaluate token - // else continue parsing at this level. break; case CXXTokenTypeEOF: CXX_DEBUG_LEAVE_TEXT("Syntax error, but tolerate it at this level"); - return true; + return CXXParserParseTemplateAngleBracketsFailedRecoverable; break; case CXXTokenTypeSemicolon: cxxParserNewStatement(); CXX_DEBUG_LEAVE_TEXT("Broken template arguments, attempting to continue"); - return true; + return CXXParserParseTemplateAngleBracketsFailedRecoverable; break; case CXXTokenTypeOpeningBracket: CXX_DEBUG_PRINT( @@ -237,23 +317,49 @@ static bool cxxParserParseTemplateAngleBrackets(void) if(!cxxParserParseUpToOneOf(CXXTokenTypeClosingBracket | CXXTokenTypeEOF, false)) { CXX_DEBUG_LEAVE_TEXT("Failed to parse up to '}EOF'"); - return false; + return CXXParserParseTemplateAngleBracketsFailed; } cxxParserNewStatement(); CXX_DEBUG_LEAVE_TEXT("Broken template arguments recovery complete"); - return true; + return CXXParserParseTemplateAngleBracketsFailedRecoverable; break; default: CXX_DEBUG_ASSERT(false,"Found unexpected token type 0x%02x",g_cxx.pToken->eType); CXX_DEBUG_LEAVE_TEXT("Found unexpected token type 0x%02x",g_cxx.pToken->eType); - return false; + return CXXParserParseTemplateAngleBracketsFailed; break; } } // never reached - CXX_DEBUG_LEAVE(); - return true; + CXX_DEBUG_LEAVE_TEXT("This should be never reached!"); + return CXXParserParseTemplateAngleBracketsFailed; +} + +// +// Parses the part of a template specification. +// Here we are pointing at the initial <. +// +static bool cxxParserParseTemplateAngleBrackets(void) +{ + CXX_DEBUG_ENTER(); + switch(cxxParserParseTemplateAngleBracketsInternal()) + { + case CXXParserParseTemplateAngleBracketsFailed: + CXX_DEBUG_LEAVE(); + return false; + break; + // TODO: We could signal failure+recovery to upper levels + // so the caller could take recovery actions too. + //case CXXParserParseTemplateAngleBracketsFailedRecoverable: + //case CXXParserParseTemplateAngleBracketsFinishedPrematurely: + //case CXXParserParseTemplateAngleBracketsSucceeded: + default: + CXX_DEBUG_LEAVE(); + return true; + break; + } + CXX_DEBUG_ASSERT(false,"Never here"); } // @@ -286,7 +392,7 @@ bool cxxParserParseTemplateAngleBracketsToSeparateChain(void) g_cxx.pTemplateTokenChain = g_cxx.pTokenChain; g_cxx.pTokenChain = pSave; - + CXX_DEBUG_LEAVE(); return true; } From 9fc990f3eb4a132da814e883bfddabdc3e199770 Mon Sep 17 00:00:00 2001 From: Szymon Tomasz Stefanek Date: Wed, 6 Jun 2018 01:17:52 +0200 Subject: [PATCH 2/2] CXX: Add a template-related unit test that isn't handled correctly by the current parser --- Units/parser-cxx.r/templates4.b/args.ctags | 4 ++++ Units/parser-cxx.r/templates4.b/expected.tags | 2 ++ Units/parser-cxx.r/templates4.b/input.cpp | 4 ++++ 3 files changed, 10 insertions(+) create mode 100644 Units/parser-cxx.r/templates4.b/args.ctags create mode 100644 Units/parser-cxx.r/templates4.b/expected.tags create mode 100644 Units/parser-cxx.r/templates4.b/input.cpp diff --git a/Units/parser-cxx.r/templates4.b/args.ctags b/Units/parser-cxx.r/templates4.b/args.ctags new file mode 100644 index 0000000000..9628bc3bf3 --- /dev/null +++ b/Units/parser-cxx.r/templates4.b/args.ctags @@ -0,0 +1,4 @@ +--sort=no +--extras=+q +--kinds-C++=* +--fields-c++=+{template} \ No newline at end of file diff --git a/Units/parser-cxx.r/templates4.b/expected.tags b/Units/parser-cxx.r/templates4.b/expected.tags new file mode 100644 index 0000000000..8ab82cf4c4 --- /dev/null +++ b/Units/parser-cxx.r/templates4.b/expected.tags @@ -0,0 +1,2 @@ +INT input.cpp /^#define INT /;" d file: +x input.cpp /^template INT x(void) { }$/;" f typeref:typename:INT template: diff --git a/Units/parser-cxx.r/templates4.b/input.cpp b/Units/parser-cxx.r/templates4.b/input.cpp new file mode 100644 index 0000000000..2abdaccc64 --- /dev/null +++ b/Units/parser-cxx.r/templates4.b/input.cpp @@ -0,0 +1,4 @@ +#define INT int + +template INT x(void) { } +