blob: f5b05deaa063e339a82005fb808dc94b15e82901 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
|
%prep
if ! zmodload zsh/pcre 2>/dev/null
then
ZTST_unimplemented="the zsh/pcre module is not available"
return 0
fi
setopt rematch_pcre
# Find a UTF-8 locale.
setopt multibyte
# Don't let LC_* override our choice of locale.
unset -m LC_\*
mb_ok=
langs=(en_{US,GB}.{UTF-,utf}8 en.UTF-8
$(locale -a 2>/dev/null | egrep 'utf8|UTF-8'))
for LANG in $langs; do
if [[ é = ? ]]; then
mb_ok=1
break;
fi
done
if [[ -z $mb_ok ]]; then
ZTST_unimplemented="no UTF-8 locale or multibyte mode is not implemented"
else
print -u $ZTST_fd Testing PCRE multibyte with locale $LANG
mkdir multibyte.tmp && cd multibyte.tmp
fi
%test
[[ 'foo→bar' =~ .([^[:ascii:]]). ]]
print $MATCH
print $match[1]
0:Basic non-ASCII regexp matching
>o→b
>→
[[ foo =~ f.+ ]] ; print $?
[[ foo =~ x.+ ]] ; print $?
[[ ! foo =~ f.+ ]] ; print $?
[[ ! foo =~ x.+ ]] ; print $?
[[ foo =~ f.+ && bar =~ b.+ ]] ; print $?
[[ foo =~ x.+ && bar =~ b.+ ]] ; print $?
[[ foo =~ f.+ && bar =~ x.+ ]] ; print $?
[[ ! foo =~ f.+ && bar =~ b.+ ]] ; print $?
[[ foo =~ f.+ && ! bar =~ b.+ ]] ; print $?
[[ ! ( foo =~ f.+ && bar =~ b.+ ) ]] ; print $?
[[ ! foo =~ x.+ && bar =~ b.+ ]] ; print $?
[[ foo =~ x.+ && ! bar =~ b.+ ]] ; print $?
[[ ! ( foo =~ x.+ && bar =~ b.+ ) ]] ; print $?
0:Regex result inversion detection
>0
>1
>1
>0
>0
>1
>1
>1
>1
>1
>0
>1
>0
# Note that PCRE_ANCHORED only means anchored at the start
# Also note that we don't unset MATCH/match on failed match (and it's an
# open issue as to whether or not we should)
pcre_compile '.(→.)'
pcre_match foo→bar
print $? $MATCH $match ; unset MATCH match
pcre_match foo.bar
print $? $MATCH $match ; unset MATCH match
pcre_match foo†bar
print $? $MATCH $match ; unset MATCH match
pcre_match foo→†ar
print $? $MATCH $match ; unset MATCH match
pcre_study
pcre_match foo→bar
print $? $MATCH $match ; unset MATCH match
pcre_compile -a '.(→.)'
pcre_match foo→bar
print $? $MATCH $match ; unset MATCH match
pcre_match o→bar
print $? $MATCH $match ; unset MATCH match
pcre_match o→b
print $? $MATCH $match ; unset MATCH match
pcre_compile 'x.(→.)'
pcre_match xo→t
print $? $MATCH $match ; unset MATCH match
pcre_match Xo→t
print $? $MATCH $match ; unset MATCH match
pcre_compile -i 'x.(→.)'
pcre_match xo→t
print $? $MATCH $match ; unset MATCH match
pcre_match Xo→t
print $? $MATCH $match ; unset MATCH match
0:pcre_compile interface testing: basic, anchored & case-insensitive
>0 o→b →b
>1
>1
>0 o→† →†
>0 o→b →b
>1
>0 o→b →b
>0 o→b →b
>0 xo→t →t
>1
>0 xo→t →t
>0 Xo→t →t
|