summaryrefslogtreecommitdiff
path: root/doc/tools/coqrst/notations/regexp.py
blob: ea820c719ea4b78077cbb1ab46d0dab1f28df65d (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
##########################################################################
##         #   The Coq Proof Assistant / The Coq Development Team       ##
##  v      #   INRIA, CNRS and contributors - Copyright 1999-2018       ##
## <O___,, #       (see CREDITS file for the list of authors)           ##
##   \VV/  ###############################################################
##    //   #    This file is distributed under the terms of the         ##
##         #     GNU Lesser General Public License Version 2.1          ##
##         #     (see LICENSE file for the text of the license)         ##
##########################################################################
"""An experimental visitor for ANTLR notation ASTs, producing regular expressions."""

import re
from io import StringIO

from .parsing import parse
from .TacticNotationsParser import TacticNotationsParser
from .TacticNotationsVisitor import TacticNotationsVisitor

class TacticNotationsToRegexpVisitor(TacticNotationsVisitor):
    def __init__(self):
        self.buffer = StringIO()

    def visitRepeat(self, ctx:TacticNotationsParser.RepeatContext):
        separator = ctx.ATOM()
        repeat_marker = ctx.LGROUP().getText()[1]

        self.buffer.write("(")
        self.visitChildren(ctx)
        self.buffer.write(")")

        if repeat_marker in ["?", "*"]:
            self.buffer.write("?")
        elif repeat_marker in ["+", "*"]:
            self.buffer.write("(")
            self.buffer.write(r"\s*" + re.escape(separator.getText() if separator else " ") + r"\s*")
            self.visitChildren(ctx)
            self.buffer.write(")*")

    def visitCurlies(self, ctx:TacticNotationsParser.CurliesContext):
        self.buffer.write(r"\{")
        self.visitChildren(ctx)
        self.buffer.write(r"\}")

    def visitAtomic(self, ctx:TacticNotationsParser.AtomicContext):
        self.buffer.write(re.escape(ctx.ATOM().getText()))

    def visitHole(self, ctx:TacticNotationsParser.HoleContext):
        self.buffer.write("([^();. \n]+)") # FIXME could allow more things

    def visitMeta(self, ctx:TacticNotationsParser.MetaContext):
        self.buffer.write(re.escape(ctx.METACHAR().getText()[1:]))

    def visitWhitespace(self, ctx:TacticNotationsParser.WhitespaceContext):
        self.buffer.write(r"\s+")

def regexpify(notation):
    """Translate notation to a Python regular expression matching it"""
    vs = TacticNotationsToRegexpVisitor()
    vs.visit(parse(notation))
    return vs.buffer.getvalue()