#! /bin/sh
# Ensure that, with -P, Unicode \p{} symbols are correctly matched.
#
# Copyright (C) 2012-2021 Free Software Foundation, Inc.
#
# Copying and distribution of this file, with or without modification,
# are permitted in any medium without royalty provided the copyright
# notice and this notice are preserved.

. "${srcdir=.}/init.sh"; path_prepend_ ../src
require_en_utf8_locale_
LC_ALL=en_US.UTF-8 require_pcre_

fail=0

# Probe: skip the whole test unless grep -P can match a Unicode
# property class (\p{S}) against a plain ASCII symbol.
echo '$' | LC_ALL=en_US.UTF-8 grep -qP '\p{S}' \
  || skip_ 'PCRE support is compiled out, or it does not support properties'

# Create the input: a single line that begins with the bytes
# \342\202\254 (the UTF-8 encoding of the euro sign).  $euro is used
# as the printf format on purpose, so that printf expands the octal
# escapes.
euro='\342\202\254 euro'
printf "$euro\\n" > in || framework_failure_

# The euro sign has the unicode "Symbol" property, so this must match:
LC_ALL=en_US.UTF-8 grep -P '^\p{S}' in > out || fail=1
compare in out || fail=1

# This RE must *not* match in the C locale, because the first
# byte is not a "Symbol".  Require exit status 1 ("no lines selected")
# exactly, so that a grep error (status 2) is not mistaken for success.
LC_ALL=C grep -P '^\p{S}' in > out
test $? -eq 1 || fail=1
compare /dev/null out || fail=1

# In the UTF-8 locale, a single "." must consume the whole multibyte
# euro sign for the anchored pattern to match the line.
LC_ALL=en_US.UTF-8 grep -P '^. euro$' in > out2 || fail=1
compare in out2 || fail=1

# Likewise with -o: the matched text must be the entire line.
LC_ALL=en_US.UTF-8 grep -oP '. euro' in > out3 || fail=1
compare in out3 || fail=1

# The negated property \P{S} must not match at the start of the line.
# As above, insist on exit status 1 rather than ignoring the status.
LC_ALL=en_US.UTF-8 grep -P '^\P{S}' in > out4
test $? -eq 1 || fail=1
compare /dev/null out4 || fail=1

Exit $fail