cucumber · shivam-sehgal · Jul 8, 2023 · Jul 9, 2023 · Jul 9, 2023 · Jul 9, 2023
diff --git a/java/src/main/java/io/cucumber/tagexpressions/TagExpressionParser.java b/java/src/main/java/io/cucumber/tagexpressions/TagExpressionParser.java
@@ -10,6 +10,8 @@
 import java.util.regex.Pattern;
 
 public final class TagExpressionParser {
+    // Whole-token pattern: a tag ('@' followed by any characters other than '@'), an operator (and, or, not) or a parenthesis.
+    private static final String VALID_TOKEN = "^(?:@[^@]*|and|or|not|\\(|\\))$";
     private static final Map<String, Assoc> ASSOC = new HashMap<String, Assoc>() {{
         put("or", Assoc.LEFT);
         put("and", Assoc.LEFT);
@@ -106,6 +108,7 @@ private static List<String> tokenize(String expr) {
                 isEscaped = true;
             } else if (c == '(' || c == ')' || Character.isWhitespace(c)) {
                 if (token.length() > 0) {
+                    isTokenValid(token,expr);
                     tokens.add(token.toString());
                     token = new StringBuilder();
                 }
@@ -116,12 +119,28 @@ private static List<String> tokenize(String expr) {
                 token.append(c);
             }
         }
-        if (token.length() > 0) {
+        if (token.length() > 0)  {
+            isTokenValid(token,expr);
             tokens.add(token.toString());
         }
         return tokens;
     }
 
+    /**
+     * Validates a single token collected by the tokenizer.
+     * Empty tokens are accepted; a non-empty token must match {@code VALID_TOKEN}.
+     *
+     * @param token candidate tag, operator or parenthesis taken from the expression
+     * @param expr  the complete expression; only used to build the error message
+     * @throws TagExpressionException if the non-empty token does not match {@code VALID_TOKEN}
+     */
+    private static void isTokenValid(StringBuilder token, String expr) {
+        if (token.length() == 0 || token.toString().matches(VALID_TOKEN)) {
+            return;
+        }
+        throw new TagExpressionException("Tag expression \"%s\" could not be parsed because of syntax error: Please adhere to the Gherkin tag naming convention, using tags like \"@tag1\" and avoiding more than one \"@\" in the tag name.", expr);
+    }
+
     private void check(TokenType expectedTokenType, TokenType tokenType) {
         if (expectedTokenType != tokenType) {
             throw new TagExpressionException("Tag expression \"%s\" could not be parsed because of syntax error: Expected %s.", infix, expectedTokenType.toString().toLowerCase());

diff --git a/javascript/src/index.ts b/javascript/src/index.ts
@@ -12,6 +12,7 @@ const ASSOC: { [key: string]: string } = {
   and: 'left',
   not: 'right',
 }
+const VALID_TOKEN = /^(?:@[^@]*|and|or|not|\(|\))$/ // whole token: a tag ('@' + non-'@' characters), an operator, or a parenthesis
 
 /**
  * Parses infix boolean expression (using Dijkstra's Shunting Yard algorithm)
@@ -109,6 +110,7 @@ function tokenize(expr: string): string[] {
       isEscaped = true
     } else if (c === '(' || c === ')' || /\s/.test(c)) {
       if (token.length > 0) {
+        isTokenValid(token,expr);
         tokens.push(token.join(''))
         token = []
       }
@@ -120,11 +122,20 @@ function tokenize(expr: string): string[] {
     }
   }
   if (token.length > 0) {
+    isTokenValid(token,expr);
     tokens.push(token.join(''))
   }
   return tokens
 }
 
+// Throws an Error if `token` (the characters of one token) does not match VALID_TOKEN; `expr` is only used in the message.
+function isTokenValid(token: string[], expr: string): void {
+  // join('') rebuilds the token text; toString() would insert commas ("a,n,d") and reject valid operators
+  if (VALID_TOKEN.test(token.join(''))) return
+  const reason = 'Please adhere to the Gherkin tag naming convention, using tags like "@tag1" and avoiding more than one "@" in the tag name.'
+  throw new Error(`Tag expression "${expr}" could not be parsed because of syntax error: ${reason}`)
+}
+
 function isUnary(token: string) {
   return 'not' === token
 }

diff --git a/ruby/lib/cucumber/tag_expressions/parser.rb b/ruby/lib/cucumber/tag_expressions/parser.rb
@@ -7,6 +7,7 @@ class Parser
       def initialize
         @expressions = []
         @operators = []
+        @valid_token = /^(?:@[^@]*|and|or|not|\(|\))$/
 
         @operator_types = {
           'or'  => { type: :binary_operator,    precedence: 0, assoc: :left },
@@ -80,6 +81,7 @@ def tokenize(infix_expression)
             escaped = true
           elsif ch == '(' || ch == ')' || ch.match(/\s/)
             if token.length > 0
+              is_token_valid(token,infix_expression)
               tokens.push(token)
               token = ""
             end
@@ -91,11 +93,18 @@ def tokenize(infix_expression)
           end
         end
         if token.length > 0
+          is_token_valid(token,infix_expression)
           tokens.push(token)
         end
         tokens
       end
 
+      # Raises a RuntimeError unless +token+ matches @valid_token; +expr+ is the full expression, used only in the message.
+      def is_token_valid(token, expr)
+        return if token.to_s.match?(@valid_token)
+        raise %Q{Tag expression "#{expr}" could not be parsed because of syntax error: Please adhere to the Gherkin tag naming convention, using tags like \"@tag1\" and avoiding more than one \"@\" in the tag name.}
+      end
+
       def push_expression(token)
         case token
         when 'and'

diff --git a/testdata/errors.yml b/testdata/errors.yml
@@ -6,17 +6,21 @@
   error: 'Tag expression "@a and (@b @c) or" could not be parsed because of syntax error: Expected operator.'
 - expression: '@a and or'
   error: 'Tag expression "@a and or" could not be parsed because of syntax error: Expected operand.'
+- expression: '@a,@b'
+  error: 'Tag expression "@a,@b" could not be parsed because of syntax error: Please adhere to the Gherkin tag naming convention, using tags like "@tag1" and avoiding more than one "@" in the tag name.'
+- expression: '(@a ,@b)'
+  error: 'Tag expression "(@a ,@b)" could not be parsed because of syntax error: Please adhere to the Gherkin tag naming convention, using tags like "@tag1" and avoiding more than one "@" in the tag name.'
 - expression: 'or or'
   error: 'Tag expression "or or" could not be parsed because of syntax error: Expected operand.'
-- expression: 'a and or'
-  error: 'Tag expression "a and or" could not be parsed because of syntax error: Expected operand.'
-- expression: 'a b'
-  error: 'Tag expression "a b" could not be parsed because of syntax error: Expected operator.'
-- expression: '( a and b ) )'
-  error: 'Tag expression "( a and b ) )" could not be parsed because of syntax error: Unmatched ).'
-- expression: '( ( a and b )'
-  error: 'Tag expression "( ( a and b )" could not be parsed because of syntax error: Unmatched (.'
-- expression: 'x or \y or z'
-  error: 'Tag expression "x or \y or z" could not be parsed because of syntax error: Illegal escape before "y".'
-- expression: 'x\ or y'
-  error: 'Tag expression "x\ or y" could not be parsed because of syntax error: Expected operator.'
+- expression: '@a and or'
+  error: 'Tag expression "@a and or" could not be parsed because of syntax error: Expected operand.'
+- expression: '@a @b'
+  error: 'Tag expression "@a @b" could not be parsed because of syntax error: Expected operator.'
+- expression: '( @a and @b ) )'
+  error: 'Tag expression "( @a and @b ) )" could not be parsed because of syntax error: Unmatched ).'
+- expression: '( ( @a and @b )'
+  error: 'Tag expression "( ( @a and @b )" could not be parsed because of syntax error: Unmatched (.'
+- expression: '@x or @\y or @z'
+  error: 'Tag expression "@x or @\y or @z" could not be parsed because of syntax error: Illegal escape before "y".'
+- expression: '@x\ or @y'
+  error: 'Tag expression "@x\ or @y" could not be parsed because of syntax error: Expected operator.'
diff --git a/testdata/evaluations.yml b/testdata/evaluations.yml
@@ -1,59 +1,59 @@
-- expression: 'not x'
+- expression: 'not @x'
   tests:
-    - variables: ['x']
+    - variables: ['@x']
       result: false
-    - variables: ['y']
+    - variables: ['@y']
       result: true
-- expression: 'x and y'
+- expression: '@x and @y'
   tests:
-    - variables: ['x', 'y']
+    - variables: ['@x', '@y']
       result: true
-    - variables: ['x']
+    - variables: ['@x']
       result: false
-    - variables: ['y']
+    - variables: ['@y']
       result: false
 
-- expression: 'x or y'
+- expression: '@x or @y'
   tests:
     - variables: []
       result: false
-    - variables: ['x', 'y']
+    - variables: ['@x', '@y']
       result: true
-    - variables: ['x']
+    - variables: ['@x']
       result: true
-    - variables: ['y']
+    - variables: ['@y']
       result: true
-- expression: 'x\(1\) or y\(2\)'
+- expression: '@x\(1\) or @y\(2\)'
   tests:
-    - variables: ['x(1)']
+    - variables: ['@x(1)']
       result: true
-    - variables: ['y(2)']
+    - variables: ['@y(2)']
       result: true
-- expression: 'x\\ or y\\\) or z\\'
+- expression: '@x\\ or @y\\\) or @z\\'
   tests:
-    - variables: ['x\']
+    - variables: ['@x\']
       result: true
-    - variables: ['y\)']
+    - variables: ['@y\)']
       result: true
-    - variables: ['z\']
+    - variables: ['@z\']
       result: true
-    - variables: ['x']
+    - variables: ['@x']
       result: false
-    - variables: ['y)']
+    - variables: ['@y)']
       result: false
-    - variables: ['z']
+    - variables: ['@z']
       result: false
-- expression: '\\x or y\\ or z\\'
+- expression: '@\\x or @y\\ or @z\\'
   tests:
-    - variables: ['\x']
+    - variables: ['@\x']
       result: true
-    - variables: ['y\']
+    - variables: ['@y\']
       result: true
-    - variables: ['z\']
+    - variables: ['@z\']
       result: true
-    - variables: ['x']
+    - variables: ['@x']
       result: false
-    - variables: ['y']
+    - variables: ['@y']
       result: false
-    - variables: ['z']
+    - variables: ['@z']
       result: false
diff --git a/testdata/parsing.yml b/testdata/parsing.yml
@@ -1,48 +1,48 @@
 - expression: ''
   formatted: 'true'
-- expression: 'a and b'
-  formatted: '( a and b )'
-- expression: 'a or b'
-  formatted: '( a or b )'
-- expression: 'not a'
-  formatted: 'not ( a )'
-- expression: 'a and b and c'
-  formatted: '( ( a and b ) and c )'
-- expression: '( a and b ) or ( c and d )'
-  formatted: '( ( a and b ) or ( c and d ) )'
-- expression: 'not a or b and not c or not d or e and f'
-  formatted: '( ( ( not ( a ) or ( b and not ( c ) ) ) or not ( d ) ) or ( e and f ) )'
-- expression: 'not a\(\) or b and not c or not d or e and f'
-  formatted: '( ( ( not ( a\(\) ) or ( b and not ( c ) ) ) or not ( d ) ) or ( e and f ) )'
+- expression: '@a and @b'
+  formatted: '( @a and @b )'
+- expression: '@a or @b'
+  formatted: '( @a or @b )'
+- expression: 'not @a'
+  formatted: 'not ( @a )'
+- expression: '@a and @b and @c'
+  formatted: '( ( @a and @b ) and @c )'
+- expression: '( @a and @b ) or ( @c and @d )'
+  formatted: '( ( @a and @b ) or ( @c and @d ) )'
+- expression: 'not @a or @b and not @c or not @d or @e and @f'
+  formatted: '( ( ( not ( @a ) or ( @b and not ( @c ) ) ) or not ( @d ) ) or ( @e and @f ) )'
+- expression: 'not @a\(\) or @b and not @c or not @d or @e and @f'
+  formatted: '( ( ( not ( @a\(\) ) or ( @b and not ( @c ) ) ) or not ( @d ) ) or ( @e and @f ) )'
 
-- expression: 'not (a and b)'
-  formatted: 'not ( a and b )'
-- expression: 'not (a or b)'
-  formatted: 'not ( a or b )'
-- expression: 'not (a and b) and c or not (d or f)'
-  formatted: '( ( not ( a and b ) and c ) or not ( d or f ) )'
+- expression: 'not (@a and @b)'
+  formatted: 'not ( @a and @b )'
+- expression: 'not (@a or @b)'
+  formatted: 'not ( @a or @b )'
+- expression: 'not (@a and @b) and @c or not (@d or @f)'
+  formatted: '( ( not ( @a and @b ) and @c ) or not ( @d or @f ) )'
 
-- expression: 'a\\ and b'
-  formatted: '( a\\ and b )'
-- expression: '\\a and b'
-  formatted: '( \\a and b )'
-- expression: 'a\\ and b'
-  formatted: '( a\\ and b )'
-- expression: 'a and b\\'
-  formatted: '( a and b\\ )'
-- expression: '( a and b\\\\)'
-  formatted: '( a and b\\\\ )'
-- expression: 'a\\\( and b\\\)'
-  formatted: '( a\\\( and b\\\) )'
-- expression: '(a and \\b)'
-  formatted: '( a and \\b )'
-- expression: 'x or(y) '
-  formatted: '( x or y )'
-- expression: 'x\(1\) or(y\(2\))'
-  formatted: '( x\(1\) or y\(2\) )'
-- expression: '\\x or y\\ or z\\'
-  formatted: '( ( \\x or y\\ ) or z\\ )'
-- expression: 'x\\ or(y\\\)) or(z\\)'
-  formatted: '( ( x\\ or y\\\) ) or z\\ )'
-- expression: 'x\  or y'
-  formatted: '( x\  or y )'
+- expression: '@a\\ and @b'
+  formatted: '( @a\\ and @b )'
+- expression: '@\\a and @b'
+  formatted: '( @\\a and @b )'
+- expression: '@a\\ and @b'
+  formatted: '( @a\\ and @b )'
+- expression: '@a and @b\\'
+  formatted: '( @a and @b\\ )'
+- expression: '( @a and @b\\\\)'
+  formatted: '( @a and @b\\\\ )'
+- expression: '@a\\\( and @b\\\)'
+  formatted: '( @a\\\( and @b\\\) )'
+- expression: '(@a and @\\b)'
+  formatted: '( @a and @\\b )'
+- expression: '@x or(@y) '
+  formatted: '( @x or @y )'
+- expression: '@x\(1\) or(@y\(2\))'
+  formatted: '( @x\(1\) or @y\(2\) )'
+- expression: '@\\x or @y\\ or @z\\'
+  formatted: '( ( @\\x or @y\\ ) or @z\\ )'
+- expression: '@x\\ or(@y\\\)) or(@z\\)'
+  formatted: '( ( @x\\ or @y\\\) ) or @z\\ )'
+- expression: '@x\  or @y'
+  formatted: '( @x\  or @y )'