mirror of
https://github.com/janet-lang/janet
synced 2025-01-11 08:00:27 +00:00
Add some more tests, add parameterized captures to patterns,
and fix some bugs.
This commit is contained in:
parent
d7626f8c57
commit
83f4a11bf3
@ -46,6 +46,7 @@ Janet makes a good system scripting language, or a language to embed in other pr
|
|||||||
* Lexical scoping
|
* Lexical scoping
|
||||||
* Imperative programming as well as functional
|
* Imperative programming as well as functional
|
||||||
* REPL
|
* REPL
|
||||||
|
* Parsing Expression Grammars built in to the core library
|
||||||
* 300+ functions and macros in the core library
|
* 300+ functions and macros in the core library
|
||||||
* Interactive environment with detailed stack traces
|
* Interactive environment with detailed stack traces
|
||||||
|
|
||||||
|
@ -42,6 +42,8 @@ typedef struct {
|
|||||||
JanetTable *grammar;
|
JanetTable *grammar;
|
||||||
JanetArray *captures;
|
JanetArray *captures;
|
||||||
JanetBuffer *scratch;
|
JanetBuffer *scratch;
|
||||||
|
const Janet *extrav;
|
||||||
|
int32_t extrac;
|
||||||
int flags;
|
int flags;
|
||||||
} State;
|
} State;
|
||||||
|
|
||||||
@ -124,7 +126,6 @@ static int32_t match_choice(State *s, int32_t argc, const Janet *argv, const uin
|
|||||||
static int32_t match_sequence(State *s, int32_t argc, const Janet *argv, const uint8_t *text) {
|
static int32_t match_sequence(State *s, int32_t argc, const Janet *argv, const uint8_t *text) {
|
||||||
int32_t traversed = 0;
|
int32_t traversed = 0;
|
||||||
for (int32_t i = 0; i < argc; i++) {
|
for (int32_t i = 0; i < argc; i++) {
|
||||||
if (text + traversed >= s->text_end) return -1;
|
|
||||||
int32_t result = match(s, argv[i], text + traversed);
|
int32_t result = match(s, argv[i], text + traversed);
|
||||||
if (result < 0) return -1;
|
if (result < 0) return -1;
|
||||||
traversed += result;
|
traversed += result;
|
||||||
@ -259,6 +260,14 @@ static int32_t match_capture_constant(State *s, int32_t argc, const Janet *argv,
|
|||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* Capture nth extra argument to peg/match */
|
||||||
|
static int32_t match_capture_arg(State *s, int32_t argc, const Janet *argv, const uint8_t *text) {
|
||||||
|
janet_fixarity(argc, 1);
|
||||||
|
int32_t n = janet_gethalfrange(argv, 0, s->extrac, "n");
|
||||||
|
push_capture(s, s->extrav[n], text, 0);
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
/* Capture replace */
|
/* Capture replace */
|
||||||
static int32_t match_replace(State *s, int32_t argc, const Janet *argv, const uint8_t *text) {
|
static int32_t match_replace(State *s, int32_t argc, const Janet *argv, const uint8_t *text) {
|
||||||
janet_fixarity(argc, 2);
|
janet_fixarity(argc, 2);
|
||||||
@ -319,6 +328,7 @@ static const MatcherPair specials[] = {
|
|||||||
{"-", match_minus},
|
{"-", match_minus},
|
||||||
{"/", match_replace},
|
{"/", match_replace},
|
||||||
{"<-", match_capture},
|
{"<-", match_capture},
|
||||||
|
{"<-arg", match_capture_arg},
|
||||||
{"<-c", match_capture_constant},
|
{"<-c", match_capture_constant},
|
||||||
{"<-g", match_group},
|
{"<-g", match_group},
|
||||||
{"<-p", match_position},
|
{"<-p", match_position},
|
||||||
@ -346,7 +356,9 @@ static int32_t match(State *s, Janet peg, const uint8_t *text) {
|
|||||||
if (!janet_checkint(peg))
|
if (!janet_checkint(peg))
|
||||||
janet_panicf("numbers in peg must be integers, got %v", peg);
|
janet_panicf("numbers in peg must be integers, got %v", peg);
|
||||||
int32_t n = janet_unwrap_integer(peg);
|
int32_t n = janet_unwrap_integer(peg);
|
||||||
return (s->text_end >= text + n) ? n : -1;
|
if (n < 0) /* Invert pattern */
|
||||||
|
return (text - n > s->text_end) ? 0 : -1;
|
||||||
|
return (text + n > s->text_end) ? -1 : n;
|
||||||
}
|
}
|
||||||
case JANET_STRING:
|
case JANET_STRING:
|
||||||
/* Match a sequence of bytes */
|
/* Match a sequence of bytes */
|
||||||
@ -371,7 +383,7 @@ static int32_t match(State *s, Janet peg, const uint8_t *text) {
|
|||||||
sizeof(specials)/sizeof(MatcherPair),
|
sizeof(specials)/sizeof(MatcherPair),
|
||||||
sizeof(MatcherPair),
|
sizeof(MatcherPair),
|
||||||
sym);
|
sym);
|
||||||
if (!mp) janet_panicf("unknown special form %v", peg);
|
if (!mp) janet_panicf("unknown special form %p", peg);
|
||||||
if (s->depth-- == 0)
|
if (s->depth-- == 0)
|
||||||
janet_panic("recursed too deeply");
|
janet_panic("recursed too deeply");
|
||||||
|
|
||||||
@ -413,12 +425,19 @@ static int32_t match(State *s, Janet peg, const uint8_t *text) {
|
|||||||
/* C Functions */
|
/* C Functions */
|
||||||
|
|
||||||
static Janet cfun_match(int32_t argc, Janet *argv) {
|
static Janet cfun_match(int32_t argc, Janet *argv) {
|
||||||
janet_arity(argc, 2, 3);
|
janet_arity(argc, 2, -1);
|
||||||
JanetByteView bytes = janet_getbytes(argv, 1);
|
JanetByteView bytes = janet_getbytes(argv, 1);
|
||||||
int32_t start = (argc == 3) ?
|
int32_t start;
|
||||||
start = janet_gethalfrange(argv, 2, bytes.len, "offset")
|
|
||||||
: 0;
|
|
||||||
State s;
|
State s;
|
||||||
|
if (argc > 2) {
|
||||||
|
start = janet_gethalfrange(argv, 2, bytes.len, "offset");
|
||||||
|
s.extrac = argc - 3;
|
||||||
|
s.extrav = argv + 3;
|
||||||
|
} else {
|
||||||
|
start = 0;
|
||||||
|
s.extrac = 0;
|
||||||
|
s.extrav = NULL;
|
||||||
|
}
|
||||||
s.flags = 0;
|
s.flags = 0;
|
||||||
s.text_start = bytes.bytes;
|
s.text_start = bytes.bytes;
|
||||||
s.text_end = bytes.bytes + bytes.len;
|
s.text_end = bytes.bytes + bytes.len;
|
||||||
|
@ -155,16 +155,36 @@
|
|||||||
|
|
||||||
# Peg
|
# Peg
|
||||||
|
|
||||||
|
(defn check-match
|
||||||
|
[pat text should-match]
|
||||||
|
(def result (peg/match pat text))
|
||||||
|
(assert (= (not should-match) (not result)) text))
|
||||||
|
|
||||||
|
# Just numbers
|
||||||
|
|
||||||
|
(check-match '(* 4 -1) "abcd" true)
|
||||||
|
(check-match '(* 4 -1) "abc" false)
|
||||||
|
(check-match '(* 4 -1) "abcde" false)
|
||||||
|
|
||||||
|
# Simple pattern
|
||||||
|
|
||||||
|
(check-match '(* (at-least 1 (range "az" "AZ")) (not 1)) "hello" true)
|
||||||
|
(check-match '(* (at-least 1 (range "az" "AZ")) (not 1)) "hello world" false)
|
||||||
|
(check-match '(* (at-least 1 (range "az" "AZ")) (not 1)) "1he11o" false)
|
||||||
|
|
||||||
|
# IP address
|
||||||
|
|
||||||
(def ip-address
|
(def ip-address
|
||||||
'{:d (range "09")
|
'{:d (range "09")
|
||||||
:0-4 (range "04")
|
:0-4 (range "04")
|
||||||
:0-5 (range "05")
|
:0-5 (range "05")
|
||||||
:block (+ (* "25" :0-5) (* "2" :0-4 :d) (* "1" :d :d) (between 1 2 :d))
|
:block (+ (* "25" :0-5) (* "2" :0-4 :d) (* "1" :d :d) (between 1 2 :d))
|
||||||
:main (* :block (between 3 3 (* "." :block)))})
|
:main (* :block (between 3 3 (* "." :block)) -1)})
|
||||||
|
|
||||||
(assert (peg/match ip-address "0.0.0.0") "peg/match 1")
|
(check-match ip-address "0.0.0.0" true)
|
||||||
(assert (peg/match ip-address "1.2.3.4") "peg/match 2")
|
(check-match ip-address "1.2.3.4" true)
|
||||||
(assert (not (peg/match ip-address "256.2.3.4")) "peg/match 3")
|
(check-match ip-address "256.2.3.4" false)
|
||||||
|
(check-match ip-address "256.2.3.2514" false)
|
||||||
|
|
||||||
# Substitution test with peg
|
# Substitution test with peg
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user