1
0
mirror of https://github.com/janet-lang/janet synced 2024-12-23 15:00:27 +00:00

Add some more tests, add parameterized captures to patterns,

and fix some bugs.
This commit is contained in:
Calvin Rose 2019-01-12 11:04:47 -05:00
parent d7626f8c57
commit 83f4a11bf3
3 changed files with 51 additions and 11 deletions

View File

@ -46,6 +46,7 @@ Janet makes a good system scripting language, or a language to embed in other pr
* Lexical scoping * Lexical scoping
* Imperative programming as well as functional * Imperative programming as well as functional
* REPL * REPL
* Parsing Expression Grammars built in to the core library
* 300+ functions and macros in the core library * 300+ functions and macros in the core library
* Interactive environment with detailed stack traces * Interactive environment with detailed stack traces

View File

@ -42,6 +42,8 @@ typedef struct {
JanetTable *grammar; JanetTable *grammar;
JanetArray *captures; JanetArray *captures;
JanetBuffer *scratch; JanetBuffer *scratch;
const Janet *extrav;
int32_t extrac;
int flags; int flags;
} State; } State;
@ -124,7 +126,6 @@ static int32_t match_choice(State *s, int32_t argc, const Janet *argv, const uin
static int32_t match_sequence(State *s, int32_t argc, const Janet *argv, const uint8_t *text) { static int32_t match_sequence(State *s, int32_t argc, const Janet *argv, const uint8_t *text) {
int32_t traversed = 0; int32_t traversed = 0;
for (int32_t i = 0; i < argc; i++) { for (int32_t i = 0; i < argc; i++) {
if (text + traversed >= s->text_end) return -1;
int32_t result = match(s, argv[i], text + traversed); int32_t result = match(s, argv[i], text + traversed);
if (result < 0) return -1; if (result < 0) return -1;
traversed += result; traversed += result;
@ -259,6 +260,14 @@ static int32_t match_capture_constant(State *s, int32_t argc, const Janet *argv,
return 0; return 0;
} }
/* Capture nth extra argument to peg/match */
static int32_t match_capture_arg(State *s, int32_t argc, const Janet *argv, const uint8_t *text) {
janet_fixarity(argc, 1);
int32_t n = janet_gethalfrange(argv, 0, s->extrac, "n");
push_capture(s, s->extrav[n], text, 0);
return 0;
}
/* Capture replace */ /* Capture replace */
static int32_t match_replace(State *s, int32_t argc, const Janet *argv, const uint8_t *text) { static int32_t match_replace(State *s, int32_t argc, const Janet *argv, const uint8_t *text) {
janet_fixarity(argc, 2); janet_fixarity(argc, 2);
@ -319,6 +328,7 @@ static const MatcherPair specials[] = {
{"-", match_minus}, {"-", match_minus},
{"/", match_replace}, {"/", match_replace},
{"<-", match_capture}, {"<-", match_capture},
{"<-arg", match_capture_arg},
{"<-c", match_capture_constant}, {"<-c", match_capture_constant},
{"<-g", match_group}, {"<-g", match_group},
{"<-p", match_position}, {"<-p", match_position},
@ -346,7 +356,9 @@ static int32_t match(State *s, Janet peg, const uint8_t *text) {
if (!janet_checkint(peg)) if (!janet_checkint(peg))
janet_panicf("numbers in peg must be integers, got %v", peg); janet_panicf("numbers in peg must be integers, got %v", peg);
int32_t n = janet_unwrap_integer(peg); int32_t n = janet_unwrap_integer(peg);
return (s->text_end >= text + n) ? n : -1; if (n < 0) /* Invert pattern */
return (text - n > s->text_end) ? 0 : -1;
return (text + n > s->text_end) ? -1 : n;
} }
case JANET_STRING: case JANET_STRING:
/* Match a sequence of bytes */ /* Match a sequence of bytes */
@ -371,7 +383,7 @@ static int32_t match(State *s, Janet peg, const uint8_t *text) {
sizeof(specials)/sizeof(MatcherPair), sizeof(specials)/sizeof(MatcherPair),
sizeof(MatcherPair), sizeof(MatcherPair),
sym); sym);
if (!mp) janet_panicf("unknown special form %v", peg); if (!mp) janet_panicf("unknown special form %p", peg);
if (s->depth-- == 0) if (s->depth-- == 0)
janet_panic("recursed too deeply"); janet_panic("recursed too deeply");
@ -413,12 +425,19 @@ static int32_t match(State *s, Janet peg, const uint8_t *text) {
/* C Functions */ /* C Functions */
static Janet cfun_match(int32_t argc, Janet *argv) { static Janet cfun_match(int32_t argc, Janet *argv) {
janet_arity(argc, 2, 3); janet_arity(argc, 2, -1);
JanetByteView bytes = janet_getbytes(argv, 1); JanetByteView bytes = janet_getbytes(argv, 1);
int32_t start = (argc == 3) ? int32_t start;
start = janet_gethalfrange(argv, 2, bytes.len, "offset")
: 0;
State s; State s;
if (argc > 2) {
start = janet_gethalfrange(argv, 2, bytes.len, "offset");
s.extrac = argc - 3;
s.extrav = argv + 3;
} else {
start = 0;
s.extrac = 0;
s.extrav = NULL;
}
s.flags = 0; s.flags = 0;
s.text_start = bytes.bytes; s.text_start = bytes.bytes;
s.text_end = bytes.bytes + bytes.len; s.text_end = bytes.bytes + bytes.len;

View File

@ -155,16 +155,36 @@
# Peg # Peg
(defn check-match
[pat text should-match]
(def result (peg/match pat text))
(assert (= (not should-match) (not result)) text))
# Just numbers
(check-match '(* 4 -1) "abcd" true)
(check-match '(* 4 -1) "abc" false)
(check-match '(* 4 -1) "abcde" false)
# Simple pattern
(check-match '(* (at-least 1 (range "az" "AZ")) (not 1)) "hello" true)
(check-match '(* (at-least 1 (range "az" "AZ")) (not 1)) "hello world" false)
(check-match '(* (at-least 1 (range "az" "AZ")) (not 1)) "1he11o" false)
# IP address
(def ip-address (def ip-address
'{:d (range "09") '{:d (range "09")
:0-4 (range "04") :0-4 (range "04")
:0-5 (range "05") :0-5 (range "05")
:block (+ (* "25" :0-5) (* "2" :0-4 :d) (* "1" :d :d) (between 1 2 :d)) :block (+ (* "25" :0-5) (* "2" :0-4 :d) (* "1" :d :d) (between 1 2 :d))
:main (* :block (between 3 3 (* "." :block)))}) :main (* :block (between 3 3 (* "." :block)) -1)})
(assert (peg/match ip-address "0.0.0.0") "peg/match 1") (check-match ip-address "0.0.0.0" true)
(assert (peg/match ip-address "1.2.3.4") "peg/match 2") (check-match ip-address "1.2.3.4" true)
(assert (not (peg/match ip-address "256.2.3.4")) "peg/match 3") (check-match ip-address "256.2.3.4" false)
(check-match ip-address "256.2.3.2514" false)
# Substitution test with peg # Substitution test with peg