Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Starting work on negation, wip #106

Merged
merged 1 commit into from
Sep 7, 2020
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
7 changes: 4 additions & 3 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -106,6 +106,7 @@ err := parser.ParseString("size = 10", ast)
- `"...":<identifier>` Match the literal, specifying the exact lexer token type to match.
- `<expr> <expr> ...` Match expressions.
- `<expr> | <expr>` Match one of the alternatives.
- `!<expr>` Match any token that is not the start of the expression (e.g. `@!";"` matches anything but the `;` character into the field).

The following modifiers can be used after any expression:

Expand Down Expand Up @@ -202,8 +203,8 @@ The best combination of speed, flexibility and usability is `lexer/regex.New()`.

Ordered by speed they are:

1. `lexer.DefaultDefinition` is based on the
[text/scanner](https://golang.org/pkg/text/scanner/) package and only allows
1. `lexer.DefaultDefinition` is based on the
[text/scanner](https://golang.org/pkg/text/scanner/) package and only allows
tokens provided by that package. This is the default lexer.
2. `lexer.Regexp()` (legacy) maps regular expression named subgroups to lexer symbols.
3. `lexer/regex.New()` is a more readable regex lexer, with each rule in the form `<name> = <regex>`.
Expand Down Expand Up @@ -372,7 +373,7 @@ There are a few areas where Participle can provide useful feedback to users of y
2. Participle will make a best effort to return as much of the AST up to the error location as possible.
3. Any node in the AST containing a field `Pos lexer.Position` or `Tok lexer.Token` will be automatically
populated from the nearest matching token.
4. Any node in the AST containing a field `EndPos lexer.Position` or `EndTok lexer.Token` will be
4. Any node in the AST containing a field `EndPos lexer.Position` or `EndTok lexer.Token` will be
automatically populated with the token at the end of the node.

These related pieces of information can be combined to provide fairly comprehensive error reporting.
14 changes: 14 additions & 0 deletions grammar.go
Original file line number Diff line number Diff line change
Expand Up @@ -139,6 +139,8 @@ func (g *generatorContext) parseTermNoModifiers(slexer *structLexer) (node, erro
out, err = g.parseCapture(slexer)
case scanner.String, scanner.RawString, scanner.Char:
out, err = g.parseLiteral(slexer)
case '!':
return g.parseNegation(slexer)
case '[':
return g.parseOptional(slexer)
case '{':
Expand Down Expand Up @@ -282,6 +284,18 @@ func (g *generatorContext) parseGroup(slexer *structLexer) (node, error) {
return &group{expr: disj}, nil
}

// A token negation
//
// Accepts both the form !"some-literal" and !SomeNamedToken
Copy link
Owner

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Is this comment accurate now?

// parseNegation parses a negated term of the form !<expr>.
//
// Both !"some-literal" and !SomeNamedToken are accepted. The caller has
// already peeked the leading '!' token.
func (g *generatorContext) parseNegation(slexer *structLexer) (node, error) {
	// Consume the '!' the caller peeked at.
	_, _ = slexer.Next()
	term, err := g.parseTermNoModifiers(slexer)
	if err != nil {
		return nil, err
	}
	return &negation{node: term}, nil
}

// A literal string.
//
// Note that for this to match, the tokeniser must be able to produce this string. For example,
Expand Down
34 changes: 34 additions & 0 deletions nodes.go
Original file line number Diff line number Diff line change
Expand Up @@ -412,6 +412,40 @@ func (l *literal) Parse(ctx *parseContext, parent reflect.Value) (out []reflect.
return nil, nil
}

// negation wraps a node and matches any single token that the wrapped node
// does NOT match (the grammar form `!<expr>`).
type negation struct {
	node node
}

// String renders the node back in grammar syntax, e.g. `!";"`.
func (n *negation) String() string {
	return "!" + stringer(n.node)
}

// Parse implements the negation operator: it succeeds on any single token
// that does NOT match the wrapped node, and captures that token's value.
// It fails (returns nil, nil) at EOF, and reports an error when the wrapped
// node DOES match at the current position.
func (n *negation) Parse(ctx *parseContext, parent reflect.Value) (out []reflect.Value, err error) {
	// Create a branch to avoid advancing the parser, but call neither Stop nor Accept on it
	// since we will discard a match.
	branch := ctx.Branch()
	notEOF, err := ctx.Peek(0)
	if err != nil {
		return nil, err
	}
	if notEOF.EOF() {
		// EOF cannot match a negation, which expects something
		return nil, nil
	}

	// Try the wrapped node on the throwaway branch; the main context is not
	// advanced either way. A parse error from the branch is deliberately
	// discarded — it simply means the wrapped node did not match, which is
	// exactly what a negation wants.
	out, err = n.node.Parse(branch, parent)

	if out != nil && err == nil {
		// out being non-nil means that what we don't want is actually here, so we report nomatch
		return nil, lexer.ErrorWithTokenf(notEOF, "unexpected '%s'", notEOF.Value)
	}

	// Just give the next token
	next, err := ctx.Next()
	if err != nil {
		return nil, err
	}
	return []reflect.Value{reflect.ValueOf(next.Value)}, nil
}

// Attempt to transform values to given type.
//
// This will dereference pointers, and attempt to parse strings into integer values, floats, etc.
Expand Down
54 changes: 54 additions & 0 deletions parser_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -1212,3 +1212,57 @@ func TestPointerToList(t *testing.T) {
// require.NoError(t, err)
// require.NotNil(t, ast.List)
// }

// TestNegation verifies that `@!';'*` captures every token up to (but not
// including) the ';' terminator, and that input lacking the terminator is
// rejected.
func TestNegation(t *testing.T) {
	type grammar struct {
		EverythingUntilSemicolon *[]string `@!';'* @';'`
	}
	parser := mustTestParser(t, &grammar{})

	actual := &grammar{}
	err := parser.ParseString(`hello world ;`, actual)
	require.NoError(t, err)
	require.Equal(t, &[]string{"hello", "world", ";"}, actual.EverythingUntilSemicolon)

	// No terminating ';' — the grammar cannot complete.
	err = parser.ParseString(`hello world`, actual)
	require.Error(t, err)
}

// TestNegationWithPattern verifies negation of a grouped expression:
// !(';' String) matches any token that does not begin that two-token
// sequence, so a lone ';' is still consumed.
func TestNegationWithPattern(t *testing.T) {
	type grammar struct {
		EverythingMoreComplex *[]string `@!(';' String)* @';' @String`
	}
	parser := mustTestParser(t, &grammar{})
	actual := &grammar{}

	err := parser.ParseString(`hello world ; 'some-str'`, actual)
	require.NoError(t, err)
	require.Equal(t, &[]string{"hello", "world", ";", "some-str"}, actual.EverythingMoreComplex)

	// The first ';' is not followed by a String, so the negation consumes it.
	err = parser.ParseString(`hello ; world ; 'hey'`, actual)
	require.NoError(t, err)
	require.Equal(t, &[]string{"hello", ";", "world", ";", "hey"}, actual.EverythingMoreComplex)

	// Ends with ';' but the required trailing String is missing.
	err = parser.ParseString(`hello ; world ;`, actual)
	require.Error(t, err)
}

func TestNegationWithDisjunction(t *testing.T) {
type grammar struct {
EverythingMoreComplex *[]string `@!(';' | ',')* @(';' | ',')`
}

// Note: we need more lookahead since (';' String) needs some before failing to match
ceymard marked this conversation as resolved.
Show resolved Hide resolved
p := mustTestParser(t, &grammar{})
ast := &grammar{}
err := p.ParseString(`hello world ;`, ast)
require.NoError(t, err)
require.Equal(t, &[]string{"hello", "world", ";"}, ast.EverythingMoreComplex)

err = p.ParseString(`hello world , `, ast)
require.NoError(t, err)
require.Equal(t, &[]string{"hello", "world", ","}, ast.EverythingMoreComplex)

}
14 changes: 14 additions & 0 deletions stringer.go
Original file line number Diff line number Diff line change
Expand Up @@ -90,6 +90,17 @@ func (s *stringerVisitor) visit(n node, depth int) { // nolint: gocognit
}
fmt.Fprint(s, "*")

case *negation:
fmt.Fprintf(s, "!")
composite := compositeNode(map[node]bool{}, n)
if composite {
fmt.Fprint(s, "(")
}
s.visit(n.node, depth)
if composite {
fmt.Fprint(s, ")")
}

case *literal:
fmt.Fprintf(s, "%q", n.s)
if n.t != lexer.EOF && n.s == "" {
Expand Down Expand Up @@ -153,6 +164,9 @@ func compositeNode(seen map[node]bool, n node) bool {
case *reference, *literal, *parseable:
return false

case *negation:
return compositeNode(seen, n.node)

case *strct:
return compositeNode(seen, n.expr)

Expand Down