summary refs log tree commit diff
diff options
context:
space:
mode:
author Karl Williamson <khw@cpan.org> 2017-11-18 09:35:25 -0700
committer Karl Williamson <khw@cpan.org> 2017-11-18 09:47:16 -0700
commit 9b79e9e3431d11e79a4f85268f70130b7b4369f6 (patch)
tree a3f683a13b8f98680f9e5be0903b622e05ba3c16
parent 04f89ea7f30fbde4ccaefee940117aa6a27d5fd0 (diff)
download perl-9b79e9e3431d11e79a4f85268f70130b7b4369f6.tar.gz
PATCH: [perl #132463] perluniprops for \p{Word}
perluniprops was not updated to reflect the changes made to what \p{Word} contains as of 5.18. What was added were the code points that have the Join_Control property, which, so far, contains only U+200C and U+200D. This commit refers to \p{Join_Control} in the description instead of hard-coding the code point numbers, so that the description automatically remains valid if Unicode changes which code points have that property. Thanks for spotting this.
-rw-r--r-- charclass_invlists.h 2
-rw-r--r-- lib/unicore/mktables 3
-rw-r--r-- regcharclass.h 2
3 files changed, 4 insertions, 3 deletions
diff --git a/charclass_invlists.h b/charclass_invlists.h
index 1ae981214c..4eb26efa91 100644
--- a/charclass_invlists.h
+++ b/charclass_invlists.h
@@ -97454,7 +97454,7 @@ static const U8 WB_table[24][24] = {
* be0f129691d479aa38646e4ca0ec1ee576ae7f75b0300a5624a7fa862fa8abba lib/unicore/extracted/DLineBreak.txt
* 92449d354d9f6b6f2f97a292ebb59f6344ffdeb83d120d7d23e569c43ba67cd5 lib/unicore/extracted/DNumType.txt
* e3a319527153b0c6c0c549b40fc6f3a01a7a0dcd6620784391db25901df3b154 lib/unicore/extracted/DNumValues.txt
- * 409910af8e9ad2cba213c70f936a6c716494029a8346e8b55dd44275cc51d35d lib/unicore/mktables
+ * d905c655c0cc448f19894613ce87026dea667bb66c65937667424fc0afdc90c4 lib/unicore/mktables
* 21653d2744fdd071f9ef138c805393901bb9547cf3e777ebf50215a191f986ea lib/unicore/version
* 913d2f93f3cb6cdf1664db888bf840bc4eb074eef824e082fceda24a9445e60c regen/charset_translations.pl
* 48418cbf454eb9ef35c73468ed5ef72ad8603490eabe74181ce4fae42ec72579 regen/mk_invlists.pl
diff --git a/lib/unicore/mktables b/lib/unicore/mktables
index 1386735e2f..200ae46d30 100644
--- a/lib/unicore/mktables
+++ b/lib/unicore/mktables
@@ -14499,7 +14499,8 @@ sub compile_perl() {
my $Word = $perl->add_match_table('Word', Full_Name => 'XPosixWord',
Description => '\w, including beyond ASCII;'
- . ' = \p{Alnum} + \pM + \p{Pc}',
+ . ' = \p{Alnum} + \pM + \p{Pc}'
+ . ' + \p{Join_Control}',
Initialize => $Alnum + $gc->table('Mark'),
);
my $Pc = $gc->table('Connector_Punctuation'); # 'Pc' Not in release 1
diff --git a/regcharclass.h b/regcharclass.h
index 6b3e846aaa..38ddd84c55 100644
--- a/regcharclass.h
+++ b/regcharclass.h
@@ -1898,7 +1898,7 @@
* be0f129691d479aa38646e4ca0ec1ee576ae7f75b0300a5624a7fa862fa8abba lib/unicore/extracted/DLineBreak.txt
* 92449d354d9f6b6f2f97a292ebb59f6344ffdeb83d120d7d23e569c43ba67cd5 lib/unicore/extracted/DNumType.txt
* e3a319527153b0c6c0c549b40fc6f3a01a7a0dcd6620784391db25901df3b154 lib/unicore/extracted/DNumValues.txt
- * 409910af8e9ad2cba213c70f936a6c716494029a8346e8b55dd44275cc51d35d lib/unicore/mktables
+ * d905c655c0cc448f19894613ce87026dea667bb66c65937667424fc0afdc90c4 lib/unicore/mktables
* 21653d2744fdd071f9ef138c805393901bb9547cf3e777ebf50215a191f986ea lib/unicore/version
* 913d2f93f3cb6cdf1664db888bf840bc4eb074eef824e082fceda24a9445e60c regen/charset_translations.pl
* 9ea6338945a7d70e5ea4b31ac7856c0b521df96be002e94b4b3b7d31debbf3ab regen/regcharclass.pl