summaryrefslogtreecommitdiff
path: root/Zend/zend_multibyte.h
diff options
context:
space:
mode:
authorMasaki Fujimoto <fujimoto@php.net>2003-08-11 05:24:42 +0000
committerMasaki Fujimoto <fujimoto@php.net>2003-08-11 05:24:42 +0000
commitab9dcec292eb8b7a928cd111044a6a3e374e2412 (patch)
tree85917557d38a4bd8d75028b24de38805d521b953 /Zend/zend_multibyte.h
parent4320c6994f0f84929141ea2543d95505e465b5d4 (diff)
downloadphp-git-ab9dcec292eb8b7a928cd111044a6a3e374e2412.tar.gz
- added script encoding support to Zend Engine 2.
this enables ZE2 to gracefully parse scripts written in UTF-8 (with BOM), UTF-16, UTF-32, Shift_JIS, ISO-2022-JP etc... (when configured with '--enable-zend-multibyte' and '--enable-mbstring')
Diffstat (limited to 'Zend/zend_multibyte.h')
-rw-r--r--Zend/zend_multibyte.h79
1 files changed, 79 insertions, 0 deletions
diff --git a/Zend/zend_multibyte.h b/Zend/zend_multibyte.h
new file mode 100644
index 0000000000..58e0228dc0
--- /dev/null
+++ b/Zend/zend_multibyte.h
@@ -0,0 +1,79 @@
+/*
+ +----------------------------------------------------------------------+
+ | Zend Engine |
+ +----------------------------------------------------------------------+
+ | Copyright (c) 1998-2003 Zend Technologies Ltd. (http://www.zend.com) |
+ +----------------------------------------------------------------------+
+ | This source file is subject to version 2.00 of the Zend license, |
+ | that is bundled with this package in the file LICENSE, and is |
+ | available at through the world-wide-web at |
+ | http://www.zend.com/license/2_00.txt. |
+ | If you did not receive a copy of the Zend license and are unable to |
+ | obtain it through the world-wide-web, please send a note to |
+ | license@zend.com so we can mail you a copy immediately. |
+ +----------------------------------------------------------------------+
+ | Authors: Masaki Fujimoto <fujimoto@php.net> |
+ | Rui Hirokawa <hirokawa@php.net> |
+ +----------------------------------------------------------------------+
+*/
+
+/* $Id$ */
+
+#ifndef ZEND_MULTIBYTE_H
+#define ZEND_MULTIBYTE_H
+
+#ifdef ZEND_MULTIBYTE
+
+#define BOM_UTF32_BE "\x00\x00\xfe\xff"
+#define BOM_UTF32_LE "\xff\xfe\x00\x00"
+#define BOM_UTF16_BE "\xfe\xff"
+#define BOM_UTF16_LE "\xff\xfe"
+#define BOM_UTF8 "\xef\xbb\xbf"
+
+typedef int (*zend_encoding_filter)(char **str, int *str_length, const char *buf, int length TSRMLS_DC);
+
+typedef char* (*zend_encoding_detector)(const char *string, int length, char *list TSRMLS_DC);
+
+typedef int (*zend_encoding_converter)(char **to, int *to_length, const char *from, int from_length, const char *encoding_to, const char *encoding_from TSRMLS_DC);
+
+typedef int (*zend_encoding_oddlen)(const char *string, int length, const char *encoding TSRMLS_DC);
+
+typedef struct _zend_encoding {
+ zend_encoding_filter input_filter; /* escape input filter */
+ zend_encoding_filter output_filter; /* escape output filter */
+ const char *name; /* encoding name */
+ const char *(*aliases)[]; /* encoding name aliases */
+ int compatible; /* flex compatible or not */
+} zend_encoding;
+
+
+/*
+ * zend multibyte APIs
+ */
+BEGIN_EXTERN_C()
+ZEND_API int zend_multibyte_set_script_encoding(char *encoding_list, int encoding_list_size TSRMLS_DC);
+ZEND_API int zend_multibyte_set_internal_encoding(char *encoding_name, int encoding_name_size TSRMLS_DC);
+ZEND_API int zend_multibyte_set_functions(zend_encoding_detector encoding_detector, zend_encoding_converter encoding_converter, zend_encoding_oddlen encoding_oddlen TSRMLS_DC);
+ZEND_API int zend_multibyte_set_filter(zend_encoding *onetime_encoding TSRMLS_DC);
+ZEND_API zend_encoding* zend_multibyte_fetch_encoding(char *encoding_name);
+ZEND_API int zend_multibyte_script_encoding_filter(char **to, int *to_length, const char *from, int from_length TSRMLS_DC);
+ZEND_API int zend_multibyte_internal_encoding_filter(char **to, int *to_length, const char *from, int from_length TSRMLS_DC);
+
+/* in zend_language_scanner.l */
+ZEND_API void zend_multibyte_yyinput_again(zend_encoding_filter old_input_filter, zend_encoding *old_encoding TSRMLS_DC);
+ZEND_API int zend_multibyte_yyinput(zend_file_handle *file_handle, char *buf, size_t len TSRMLS_DC);
+ZEND_API int zend_multibyte_read_script(TSRMLS_D);
+END_EXTERN_C()
+
+#endif /* ZEND_MULTIBYTE */
+
+#endif /* ZEND_MULTIBYTE_H */
+
+/*
+ * Local variables:
+ * tab-width: 4
+ * c-basic-offset: 4
+ * End:
+ * vim600: sw=4 ts=4 tw=78
+ * vim<600: sw=4 ts=4 tw=78
+ */