2020-01-03 01:38:49 +03:00
|
|
|
-- (C) Dmitry Boulytchev, St. Petersburg State University, JetBrains Research, 2020
|
|
|
|
|
-- Matcher: simple string matching library.
|
2019-12-31 00:59:28 +03:00
|
|
|
|
2020-01-03 01:38:49 +03:00
|
|
|
-- Create a regular expression representation.
|
|
|
|
|
-- Arguments:
|
|
|
|
|
-- r --- a string representation for regular expression (as per GNU regexp)
|
|
|
|
|
-- name --- a string describing the meaning of the expression in free form
|
|
|
|
|
-- (e.g. "identifier", "string constant", etc.), used for error
|
|
|
|
|
-- reporting
|
2020-01-14 17:08:35 +03:00
|
|
|
public fun createRegexp (r, name) {
  -- Compile the textual pattern first, then pair the compiled form with
  -- its human-readable name: element 0 is what matchRegexp feeds to
  -- regexpMatch, element 1 is what it prints in "... expected" messages.
  local compiled = regexp (r);

  [compiled, name]
}
|
|
|
|
|
|
|
|
|
|
-- Create an immutable matcher.
|
|
|
|
|
-- Arguments:
|
|
|
|
|
-- buf --- a string to match in
|
|
|
|
|
-- pos --- an integer beginning position to match from
|
|
|
|
|
-- line, col --- line and column numbers
|
|
|
|
|
-- This function is internal, do not use it directly.
|
|
|
|
|
-- To initially create a matcher use the matcherInit function (see below).
|
|
|
|
|
fun matcherCreate (buf, pos, line, col) {
  -- Shows a matcher in a readable form
  fun show () {
    sprintf ("buf : %-40s\npos : %d\nline: %d\ncol : %d\n", buf, pos, line, col)
  }

  -- Calculates the number of remaining unmatched characters in the buffer
  fun rest () {
    buf.length - pos
  }

  -- Moves the position pointer forward by the given number of characters
  -- and returns a new matcher for the advanced position; the current
  -- matcher is left untouched. Line and column numbers are recomputed
  -- from the characters being skipped: a newline starts a new line at
  -- column 1, a tab advances the column by 8, anything else by 1.
  fun shift (n) {
    local i, l = line, c = col;

    -- Scan exactly the n consumed characters, i.e. indices
    -- pos .. pos+n-1. The bound has to be pos + n (an absolute index),
    -- not n (a count): otherwise nothing, or too little, is scanned as
    -- soon as pos > 0 and line/column stop being updated.
    for i := pos, i < pos + n, i := i+1 do
      case buf [i] of
        '\n' -> l := l + 1; c := 1
      | '\t' -> c := c + 8
      | _    -> c := c + 1
      esac
    od;

    matcherCreate (buf, pos + n, l, c)
  }

  -- Matches the string s at the current position. Returns
  -- Succ (matcher advanced past s, s) on success and Fail (message)
  -- otherwise. The length check is done first, in its own branch, so
  -- that matchSubString is never asked to look past the end of buf.
  fun matchString (s) {
    if s.length > rest ()
    then Fail (sprintf ("""%s"" expected at %d:%d", s, line, col))
    elif matchSubString (buf, s, pos) then Succ (shift (s.length), s)
    else Fail (sprintf ("""%s"" expected at %d:%d", s, line, col))
    fi
  }

  -- Matches the regular expression r (a pair built by createRegexp:
  -- r[0] is the compiled expression, r[1] its descriptive name) at the
  -- current position. Returns Succ (advanced matcher, matched text) or
  -- Fail (message). Note that only a result greater than zero counts as
  -- success, so an empty match is reported as a failure.
  fun matchRegexp (r) {
    local n;

    if (n := regexpMatch (r[0], buf, pos)) > 0
    then Succ (shift (n), substring (buf, pos, n))
    else Fail (sprintf ("%s expected at %d:%d", r[1], line, col))
    fi
  }

  -- Checks whether the whole buffer has been consumed
  fun eof () {
    rest () == 0
  }

  -- The matcher itself: an array of closures over buf/pos/line/col.
  -- The order is part of the interface, the public wrappers index it:
  -- 0 - show, 1 - eof, 2 - matchString, 3 - matchRegexp.
  [show,
   eof,
   matchString,
   matchRegexp]
}
|
|
|
|
|
|
2020-01-14 17:08:35 +03:00
|
|
|
-- Returns a readable description of the matcher m by calling the
-- closure stored in slot 0 of the matcher.
public fun show (m) {
  local render = m [0];

  render ()
}
|
|
|
|
|
|
2020-01-14 17:08:35 +03:00
|
|
|
-- Tells whether the matcher m has reached the end of its buffer by
-- calling the closure stored in slot 1 of the matcher.
public fun endOf (m) {
  local atEnd = m [1];

  atEnd ()
}
|
|
|
|
|
|
2020-01-14 17:08:35 +03:00
|
|
|
-- Matches the string s with the matcher m by passing s to the closure
-- stored in slot 2 of the matcher; the closure's result is returned as is.
public fun matchString (m, s) {
  local match = m [2];

  match (s)
}
|
|
|
|
|
|
2020-01-04 21:50:14 +03:00
|
|
|
-- Matches against a regexp
|
2020-01-14 17:08:35 +03:00
|
|
|
public fun matchRegexp (m, r) {
  -- Slot 3 of a matcher holds its regexp-matching closure; r is handed
  -- over untouched and the closure's result is returned as is.
  local match = m [3];

  match (r)
}
|
|
|
|
|
|
2020-01-04 21:50:14 +03:00
|
|
|
-- Creates a fresh matcher from a string buffer
|
|
|
|
|
public fun matcherInit (buf) {
  -- A fresh matcher starts at offset 0 of the buffer, which is reported
  -- as line 1, column 1.
  local startPos = 0, startLine = 1, startCol = 1;

  matcherCreate (buf, startPos, startLine, startCol)
}
|