From dc4bab73d295bd6372c5b57714105128c54f8371 Mon Sep 17 00:00:00 2001 From: Alex Shinn Date: Fri, 29 Nov 2013 23:59:04 +0900 Subject: [PATCH] Expanding the grapheme cases so that the hangul variants are never empty. --- lib/chibi/regexp.scm | 14 +++++++++++++- 1 file changed, 13 insertions(+), 1 deletion(-) diff --git a/lib/chibi/regexp.scm b/lib/chibi/regexp.scm index 202244a4..881e1ff7 100644 --- a/lib/chibi/regexp.scm +++ b/lib/chibi/regexp.scm @@ -696,10 +696,22 @@ ((grapheme) (->rx `(or (: "\r\n") - (: (* ,char-set:hangul-l) + (: (+ ,char-set:hangul-l) (or ,char-set:hangul-lvt (: (? ,char-set:hangul-lv) (* ,char-set:hangul-v))) (* ,char-set:hangul-t)) + (: (* ,char-set:hangul-l) + (or ,char-set:hangul-lvt + (: ,char-set:hangul-lv (* ,char-set:hangul-v))) + (* ,char-set:hangul-t)) + (: (* ,char-set:hangul-l) + (or ,char-set:hangul-lvt + (: (? ,char-set:hangul-lv) (+ ,char-set:hangul-v))) + (* ,char-set:hangul-t)) + (: (* ,char-set:hangul-l) + (or ,char-set:hangul-lvt + (: (? ,char-set:hangul-lv) (* ,char-set:hangul-v))) + (+ ,char-set:hangul-t)) (+ ,char-set:regional-indicator) control (: (~ control ("\r\n"))