Author: Haojian Wu
Date: 2022-07-19T09:44:45+02:00
New Revision: d489b3807f096584175c321ce7f20e9dcd49b1da

URL: 
https://github.com/llvm/llvm-project/commit/d489b3807f096584175c321ce7f20e9dcd49b1da
DIFF: 
https://github.com/llvm/llvm-project/commit/d489b3807f096584175c321ce7f20e9dcd49b1da.diff

LOG: [pseudo] Implement a guard to determine function declarator.

This eliminates some simple-declaration/function-definition false
parses.

- implement a function to determine whether a declarator ForestNode is a
  function declarator;
- split the standard declarator into two guarded nonterminals,
  function-declarator and non-function-declarator.

Differential Revision: https://reviews.llvm.org/D129222

Added: 
    

Modified: 
    clang-tools-extra/pseudo/lib/cxx/CXX.cpp
    clang-tools-extra/pseudo/lib/cxx/cxx.bnf
    clang-tools-extra/pseudo/test/cxx/declarator-function.cpp
    clang-tools-extra/pseudo/test/cxx/declarator-var.cpp
    clang-tools-extra/pseudo/test/cxx/recovery-func-parameters.cpp
    clang-tools-extra/pseudo/test/cxx/recovery-init-list.cpp
    clang-tools-extra/pseudo/test/glr.cpp

Removed: 
    


################################################################################
diff  --git a/clang-tools-extra/pseudo/lib/cxx/CXX.cpp 
b/clang-tools-extra/pseudo/lib/cxx/CXX.cpp
index 9a03422153f06..d6c056a25e365 100644
--- a/clang-tools-extra/pseudo/lib/cxx/CXX.cpp
+++ b/clang-tools-extra/pseudo/lib/cxx/CXX.cpp
@@ -46,6 +46,66 @@ bool guardExport(llvm::ArrayRef<const ForestNode *> RHS,
   return Tokens.tokens()[RHS.front()->startTokenIndex()].text() == "export";
 }
 
+bool isFunctionDeclarator(const ForestNode *Declarator) {
+  assert(Declarator->symbol() == (SymbolID)(cxx::Symbol::declarator));
+  bool IsFunction = false;
+  using cxx::Rule;
+  while (true) {
+    // not well-formed code, return the best guess.
+    if (Declarator->kind() != ForestNode::Sequence)
+      return IsFunction;
+
+    switch ((cxx::Rule)Declarator->rule()) {
+    case Rule::noptr_declarator_0declarator_id: // reached the bottom
+      return IsFunction;
+    // *X is a nonfunction (unless X is a function).
+    case Rule::ptr_declarator_0ptr_operator_1ptr_declarator:
+      Declarator = Declarator->elements()[1];
+      IsFunction = false;
+      continue;
+    // X() is a function (unless X is a pointer or similar).
+    case Rule::
+        
declarator_0noptr_declarator_1parameters_and_qualifiers_2trailing_return_type:
+    case Rule::noptr_declarator_0noptr_declarator_1parameters_and_qualifiers:
+      Declarator = Declarator->elements()[0];
+      IsFunction = true;
+      continue;
+    // X[] is an array (unless X is a pointer or function).
+    case Rule::
+        
noptr_declarator_0noptr_declarator_1l_square_2constant_expression_3r_square:
+    case Rule::noptr_declarator_0noptr_declarator_1l_square_2r_square:
+      Declarator = Declarator->elements()[0];
+      IsFunction = false;
+      continue;
+    // (X) is whatever X is.
+    case Rule::noptr_declarator_0l_paren_1ptr_declarator_2r_paren:
+      Declarator = Declarator->elements()[1];
+      continue;
+    case Rule::ptr_declarator_0noptr_declarator:
+    case Rule::declarator_0ptr_declarator:
+      Declarator = Declarator->elements()[0];
+      continue;
+
+    default:
+      assert(false && "unhandled declarator for IsFunction");
+      return IsFunction;
+    }
+  }
+  llvm_unreachable("unreachable");
+}
+bool guardFunction(llvm::ArrayRef<const ForestNode *> RHS,
+                   const TokenStream &Tokens) {
+  assert(RHS.size() == 1 &&
+         RHS.front()->symbol() == (SymbolID)(cxx::Symbol::declarator));
+  return isFunctionDeclarator(RHS.front());
+}
+bool guardNonFunction(llvm::ArrayRef<const ForestNode *> RHS,
+                      const TokenStream &Tokens) {
+  assert(RHS.size() == 1 &&
+         RHS.front()->symbol() == (SymbolID)(cxx::Symbol::declarator));
+  return !isFunctionDeclarator(RHS.front());
+}
+
 llvm::DenseMap<ExtensionID, RuleGuard> buildGuards() {
   return {
       {(ExtensionID)Extension::Override, guardOverride},
@@ -53,6 +113,8 @@ llvm::DenseMap<ExtensionID, RuleGuard> buildGuards() {
       {(ExtensionID)Extension::Import, guardImport},
       {(ExtensionID)Extension::Export, guardExport},
       {(ExtensionID)Extension::Module, guardModule},
+      {(ExtensionID)Extension::FunctionDeclarator, guardFunction},
+      {(ExtensionID)Extension::NonFunctionDeclarator, guardNonFunction},
   };
 }
 

diff  --git a/clang-tools-extra/pseudo/lib/cxx/cxx.bnf 
b/clang-tools-extra/pseudo/lib/cxx/cxx.bnf
index 08384af9d9399..4e434b1e037cc 100644
--- a/clang-tools-extra/pseudo/lib/cxx/cxx.bnf
+++ b/clang-tools-extra/pseudo/lib/cxx/cxx.bnf
@@ -332,7 +332,7 @@ block-declaration := using-directive
 block-declaration := static_assert-declaration
 block-declaration := alias-declaration
 block-declaration := opaque-enum-declaration
-nodeclspec-function-declaration := declarator ;
+nodeclspec-function-declaration := function-declarator ;
 alias-declaration := USING IDENTIFIER = defining-type-id ;
 simple-declaration := decl-specifier-seq init-declarator-list_opt ;
 simple-declaration := decl-specifier-seq ref-qualifier_opt [ identifier-list ] 
initializer ;
@@ -402,8 +402,19 @@ placeholder-type-specifier := type-constraint_opt AUTO
 placeholder-type-specifier := type-constraint_opt DECLTYPE ( AUTO )
 init-declarator-list := init-declarator
 init-declarator-list := init-declarator-list , init-declarator
-init-declarator := declarator initializer_opt
-init-declarator := declarator requires-clause
+#! The standard grammar allows:
+#!   1) an initializer with any declarator, including a function declarator, this
+#!      creates an ambiguity where a function definition is misparsed as a simple
+#!      declaration;
+#!   2) a function-body with any declarator, including a non-function
+#!      declarator, this creates an ambiguity where a simple-declaration is
+#!      misparsed as a function-definition;
+#! We extend the standard declarator to function-declarator and non-function-declarator
+#! to eliminate these false parses.
+init-declarator := non-function-declarator initializer_opt
+init-declarator := function-declarator requires-clause_opt
+function-declarator := declarator [guard=FunctionDeclarator]
+non-function-declarator := declarator [guard=NonFunctionDeclarator]
 declarator := ptr-declarator
 declarator := noptr-declarator parameters-and-qualifiers trailing-return-type
 ptr-declarator := noptr-declarator
@@ -472,8 +483,8 @@ designator := [ expression ]
 expr-or-braced-init-list := expression
 expr-or-braced-init-list := braced-init-list
 # dcl.fct
-function-definition := decl-specifier-seq_opt declarator 
virt-specifier-seq_opt function-body
-function-definition := decl-specifier-seq_opt declarator requires-clause 
function-body
+function-definition := decl-specifier-seq_opt function-declarator 
virt-specifier-seq_opt function-body
+function-definition := decl-specifier-seq_opt function-declarator 
requires-clause function-body
 function-body := ctor-initializer_opt compound-statement
 function-body := function-try-block
 function-body := = DEFAULT ;

diff  --git a/clang-tools-extra/pseudo/test/cxx/declarator-function.cpp 
b/clang-tools-extra/pseudo/test/cxx/declarator-function.cpp
index 59dccf993af47..4d7972807c6db 100644
--- a/clang-tools-extra/pseudo/test/cxx/declarator-function.cpp
+++ b/clang-tools-extra/pseudo/test/cxx/declarator-function.cpp
@@ -1,11 +1,9 @@
 // The standard grammar allows an init-list with any declarator, including
 // a function declarator. This creates an ambiguity where a function-definition
 // is misparsed as a simple-declaration.
-// FIXME: eliminate this false parse.
-// XFAIL: *
 
 // RUN: clang-pseudo -grammar=cxx -source=%s --print-forest | FileCheck %s
 void s(){};
 // CHECK-NOT:      simple-declaration
-// CHECK:          function-definition := decl-specifier-seq declarator
-// function-body CHECK-NOT:      simple-declaration
+// CHECK:          function-definition := decl-specifier-seq 
function-declarator function-body
+// CHECK-NOT:      simple-declaration

diff  --git a/clang-tools-extra/pseudo/test/cxx/declarator-var.cpp 
b/clang-tools-extra/pseudo/test/cxx/declarator-var.cpp
index 057ec55b1c925..5aedd8037513f 100644
--- a/clang-tools-extra/pseudo/test/cxx/declarator-var.cpp
+++ b/clang-tools-extra/pseudo/test/cxx/declarator-var.cpp
@@ -1,11 +1,9 @@
 // The standard grammar allows a function-body to use any declarator, including
 // a non-function declarator. This creates an ambiguity where a
 // simple-declaration is misparsed as a function-definition.
-// FIXME: eliminate this false parse.
-// XFAIL: *
 
 // RUN: clang-pseudo -grammar=cxx -source=%s --print-forest | FileCheck %s
 void (*s)(){};
 // CHECK-NOT:      function-definition
-// CHECK:          init-declarator := declarator initializer
+// CHECK:          init-declarator := non-function-declarator initializer
 // CHECK-NOT:      function-definition

diff  --git a/clang-tools-extra/pseudo/test/cxx/recovery-func-parameters.cpp 
b/clang-tools-extra/pseudo/test/cxx/recovery-func-parameters.cpp
index d3007c3fb4bc6..0b41f881fa3bf 100644
--- a/clang-tools-extra/pseudo/test/cxx/recovery-func-parameters.cpp
+++ b/clang-tools-extra/pseudo/test/cxx/recovery-func-parameters.cpp
@@ -1,8 +1,8 @@
 // RUN: clang-pseudo -grammar=cxx -source=%s --print-forest | FileCheck %s
 void foo(complete garbage???) {}
-// CHECK:      translation-unit~function-definition := decl-specifier-seq 
declarator function-body
+// CHECK:      translation-unit~function-definition := decl-specifier-seq 
function-declarator function-body
 // CHECK-NEXT: ├─decl-specifier-seq~VOID := tok[0]
-// CHECK-NEXT: ├─declarator~noptr-declarator := noptr-declarator 
parameters-and-qualifiers
+// CHECK-NEXT: ├─function-declarator~noptr-declarator := noptr-declarator 
parameters-and-qualifiers
 // CHECK-NEXT: │ ├─noptr-declarator~IDENTIFIER := tok[1]
 // CHECK-NEXT: │ └─parameters-and-qualifiers := ( parameter-declaration-clause 
[recover=Brackets] )
 // CHECK-NEXT: │   ├─( := tok[2]

diff  --git a/clang-tools-extra/pseudo/test/cxx/recovery-init-list.cpp 
b/clang-tools-extra/pseudo/test/cxx/recovery-init-list.cpp
index 283c53d78128d..38216ad964772 100644
--- a/clang-tools-extra/pseudo/test/cxx/recovery-init-list.cpp
+++ b/clang-tools-extra/pseudo/test/cxx/recovery-init-list.cpp
@@ -3,7 +3,7 @@ auto x = { complete garbage };
 // CHECK:      translation-unit~simple-declaration
 // CHECK-NEXT: ├─decl-specifier-seq~AUTO := tok[0]
 // CHECK-NEXT: ├─init-declarator-list~init-declarator
-// CHECK-NEXT: │ ├─declarator~IDENTIFIER := tok[1]
+// CHECK-NEXT: │ ├─non-function-declarator~IDENTIFIER := tok[1]
 // CHECK-NEXT: │ └─initializer~brace-or-equal-initializer
 // CHECK-NEXT: │   ├─= := tok[2]
 // CHECK-NEXT: │   └─initializer-clause~braced-init-list

diff  --git a/clang-tools-extra/pseudo/test/glr.cpp 
b/clang-tools-extra/pseudo/test/glr.cpp
index 0eb19fba2ecc6..24b2ac05f6f1b 100644
--- a/clang-tools-extra/pseudo/test/glr.cpp
+++ b/clang-tools-extra/pseudo/test/glr.cpp
@@ -1,4 +1,4 @@
-// RUN: clang-pseudo -grammar=%cxx-bnf-file -source=%s --print-forest 
-print-statistics | FileCheck %s
+// RUN: clang-pseudo -grammar=cxx -source=%s --print-forest -print-statistics 
| FileCheck %s
 
 void foo() {
   T* a; // a multiply expression or a pointer declaration?


        
_______________________________________________
cfe-commits mailing list
cfe-commits@lists.llvm.org
https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits

Reply via email to