mirror of
https://github.com/php/php-src.git
synced 2025-08-15 13:38:49 +02:00

This is a comprehensive refactoring of the error mechanism of the Intl extension. By moving the prefixing of the current method/function being executed to the actual error message creation (by accessing the execution context), we get the following benefits:
- Accurate error messages indicating *what* call caused the error.
- As we *always* "copy" the message, the `copyMsg` arg becomes unused, meaning we can reduce the size of the `intl_error` struct by 4 bytes.
- Saving the message as a zend_string means we know its length.
- It removes the need to pass a "function name" `char*` around across multiple calls.
- Intl's exception mechanism can be used to generate exceptions for constructor calls.
  - This removes the need for replacing the error handler,
  - which didn't do anything anyway in silent mode, and which required throwing non-descriptive exceptions.
374 lines
9.1 KiB
C++
374 lines
9.1 KiB
C++
/*
|
|
+----------------------------------------------------------------------+
|
|
| This source file is subject to version 3.01 of the PHP license, |
|
|
| that is bundled with this package in the file LICENSE, and is |
|
|
| available through the world-wide-web at the following url: |
|
|
| https://www.php.net/license/3_01.txt |
|
|
| If you did not receive a copy of the PHP license and are unable to |
|
|
| obtain it through the world-wide-web, please send a note to |
|
|
| license@php.net so we can mail you a copy immediately. |
|
|
+----------------------------------------------------------------------+
|
|
| Authors: Gustavo Lopes <cataphract@php.net> |
|
|
+----------------------------------------------------------------------+
|
|
*/
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include "config.h"
|
|
#endif
|
|
|
|
#include <unicode/brkiter.h>
|
|
#include "codepointiterator_internal.h"
|
|
|
|
#include "breakiterator_iterators.h"
|
|
|
|
extern "C" {
|
|
#include "../php_intl.h"
|
|
#define USE_BREAKITERATOR_POINTER 1
|
|
#include "breakiterator_class.h"
|
|
#include "../locale/locale.h"
|
|
#include <zend_exceptions.h>
|
|
#include <zend_interfaces.h>
|
|
}
|
|
|
|
using PHP::CodePointBreakIterator;
|
|
using icu::BreakIterator;
|
|
using icu::Locale;
|
|
|
|
/*
 * IntlBreakIterator::__construct()
 *
 * Always throws: the call below is unconditional, NULL is passed as the
 * exception class and 0 as the exception code.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, __construct)
{
	static const char message[] =
		"An object of this type cannot be created with the new operator";

	zend_throw_exception(NULL, message, 0);
}
|
|
|
|
/*
 * Shared body of the static create*Instance() methods.
 *
 * func is the ICU factory to invoke; it is handed a Locale built from the
 * optional string argument, or from intl_locale_get_default() when that
 * argument is omitted or null.
 *
 * The resulting ICU status is always recorded with intl_error_set_code().
 * On failure a custom message is set and null is returned; on success
 * return_value is populated through breakiterator_object_create().
 */
static void _breakiter_factory(
		BreakIterator *(*func)(const Locale&, UErrorCode&),
		INTERNAL_FUNCTION_PARAMETERS)
{
	char *locale_arg = NULL;
	size_t locale_arg_len; /* filled by the parameter macro, not read afterwards */
	UErrorCode icu_status = UErrorCode();

	intl_error_reset(NULL);

	ZEND_PARSE_PARAMETERS_START(0, 1)
		Z_PARAM_OPTIONAL
		Z_PARAM_STRING_OR_NULL(locale_arg, locale_arg_len)
	ZEND_PARSE_PARAMETERS_END();

	/* No locale given (or explicit null): fall back to the default one. */
	const char *locale_name = (locale_arg != NULL)
		? locale_arg
		: intl_locale_get_default();

	BreakIterator *created = func(Locale::createFromName(locale_name), icu_status);

	intl_error_set_code(NULL, icu_status);
	if (U_FAILURE(icu_status)) {
		intl_error_set_custom_msg(NULL, "error creating BreakIterator");
		RETURN_NULL();
	}

	breakiterator_object_create(return_value, created, 1);
}
|
|
|
|
/*
 * IntlBreakIterator::createWordInstance()
 *
 * Forwards the call to _breakiter_factory() with ICU's
 * BreakIterator::createWordInstance as the factory function.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, createWordInstance)
{
	_breakiter_factory(&BreakIterator::createWordInstance, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::createLineInstance()
 *
 * Forwards the call to _breakiter_factory() with ICU's
 * BreakIterator::createLineInstance as the factory function.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, createLineInstance)
{
	_breakiter_factory(&BreakIterator::createLineInstance, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::createCharacterInstance()
 *
 * Forwards the call to _breakiter_factory() with ICU's
 * BreakIterator::createCharacterInstance as the factory function.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, createCharacterInstance)
{
	_breakiter_factory(&BreakIterator::createCharacterInstance, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::createSentenceInstance()
 *
 * Forwards the call to _breakiter_factory() with ICU's
 * BreakIterator::createSentenceInstance as the factory function.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, createSentenceInstance)
{
	_breakiter_factory(&BreakIterator::createSentenceInstance, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::createTitleInstance()
 *
 * Forwards the call to _breakiter_factory() with ICU's
 * BreakIterator::createTitleInstance as the factory function.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, createTitleInstance)
{
	_breakiter_factory(&BreakIterator::createTitleInstance, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::createCodePointInstance()
 *
 * Takes no arguments. Allocates a PHP::CodePointBreakIterator and hands it
 * to breakiterator_object_create() to populate return_value. Unlike the
 * other factories this one involves no locale and no ICU status check.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, createCodePointInstance)
{
	intl_error_reset(NULL);

	ZEND_PARSE_PARAMETERS_NONE();

	breakiterator_object_create(return_value, new CodePointBreakIterator(), 1);
}
|
|
|
|
/*
 * IntlBreakIterator::getText()
 *
 * Takes no arguments. Returns a ZVAL_COPY of the text zval stored on the
 * object, or null while that zval is still undefined.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, getText)
{
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_NONE();

	/* Macro defined outside this file; presumably bails out when the
	 * object is not usable -- confirm against its definition. */
	BREAKITER_METHOD_FETCH_OBJECT;

	if (!Z_ISUNDEF(bio->text)) {
		ZVAL_COPY(return_value, &bio->text);
		return;
	}

	RETURN_NULL();
}
|
|
|
|
/*
 * IntlBreakIterator::setText(string $text)
 *
 * Opens a UTF-8 UText over the given string, installs it on the underlying
 * ICU BreakIterator and remembers the string on the object. Returns true on
 * success; each ICU call is followed by INTL_METHOD_CHECK_STATUS, which
 * handles the failure case (macro defined outside this file).
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, setText)
{
	zend_string *input;
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_START(1, 1)
		Z_PARAM_STR(input)
	ZEND_PARSE_PARAMETERS_END();

	BREAKITER_METHOD_FETCH_OBJECT;

	/* NULL as first argument: let ICU allocate a fresh UText. */
	UText *utext = utext_openUTF8(NULL, ZSTR_VAL(input), ZSTR_LEN(input),
		BREAKITER_ERROR_CODE_P(bio));
	INTL_METHOD_CHECK_STATUS(bio, "error opening UText");

	bio->biter->setText(utext, BREAKITER_ERROR_CODE(bio));
	/* ICU shallow clones the UText, so ours is closed right away -- before
	 * the status check, so that it is released on failure too. */
	utext_close(utext);
	INTL_METHOD_CHECK_STATUS(bio, "error calling BreakIterator::setText()");

	/* When ICU clones the UText, it does not copy the buffer, so we have to
	 * keep the string buffer around by holding a reference to its zval. This
	 * also allows a faster implementation of getText(). */
	zval_ptr_dtor(&bio->text);
	ZVAL_STR_COPY(&bio->text, input);

	RETURN_TRUE;
}
|
|
|
|
/*
 * Shared body for methods that take no PHP arguments and return the int32_t
 * produced by a BreakIterator member function.
 *
 * func is the member function to invoke on the object's ICU iterator; its
 * result is widened to zend_long and returned.
 */
static void _breakiter_no_args_ret_int32(
		int32_t (BreakIterator::*func)(),
		INTERNAL_FUNCTION_PARAMETERS)
{
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_NONE();

	BREAKITER_METHOD_FETCH_OBJECT;

	RETURN_LONG((zend_long)(bio->biter->*func)());
}
|
|
|
|
/*
 * Shared body for methods that take one integer argument and return the
 * int32_t produced by a BreakIterator member function.
 *
 * func is the member function to invoke on the object's ICU iterator. The
 * PHP integer must fit in an int32_t; otherwise an argument value error is
 * raised for argument 1. The range check runs after the object fetch.
 */
static void _breakiter_int32_ret_int32(
		int32_t (BreakIterator::*func)(int32_t),
		INTERNAL_FUNCTION_PARAMETERS)
{
	zend_long value;
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_START(1, 1)
		Z_PARAM_LONG(value)
	ZEND_PARSE_PARAMETERS_END();

	BREAKITER_METHOD_FETCH_OBJECT;

	const bool fits_int32 = (value >= INT32_MIN) && (value <= INT32_MAX);
	if (UNEXPECTED(!fits_int32)) {
		zend_argument_value_error(1, "must be between %d and %d", INT32_MIN, INT32_MAX);
		RETURN_THROWS();
	}

	RETURN_LONG((zend_long)(bio->biter->*func)((int32_t)value));
}
|
|
|
|
/*
 * IntlBreakIterator::first()
 *
 * Forwards to _breakiter_no_args_ret_int32() with BreakIterator::first.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, first)
{
	_breakiter_no_args_ret_int32(&BreakIterator::first, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::last()
 *
 * Forwards to _breakiter_no_args_ret_int32() with BreakIterator::last.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, last)
{
	_breakiter_no_args_ret_int32(&BreakIterator::last, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::previous()
 *
 * Forwards to _breakiter_no_args_ret_int32() with BreakIterator::previous.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, previous)
{
	_breakiter_no_args_ret_int32(&BreakIterator::previous, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::next(?int $offset = null)
 *
 * Dispatches between the two BreakIterator::next overloads: the int32_t one
 * when a non-null argument was passed, the argument-less one otherwise.
 * The argument is only inspected for null here; the selected helper parses
 * the parameters again itself.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, next)
{
	zval *offset_arg = NULL;

	ZEND_PARSE_PARAMETERS_START(0, 1)
		Z_PARAM_OPTIONAL
		Z_PARAM_ZVAL_OR_NULL(offset_arg)
	ZEND_PARSE_PARAMETERS_END();

	if (offset_arg != NULL) {
		_breakiter_int32_ret_int32(&BreakIterator::next, INTERNAL_FUNCTION_PARAM_PASSTHRU);
		return;
	}

	/* The no-argument helper parses with ZEND_PARSE_PARAMETERS_NONE(), so
	 * the argument count is zeroed first; an explicitly passed null would
	 * presumably be rejected by it otherwise. */
	ZEND_NUM_ARGS() = 0;
	_breakiter_no_args_ret_int32(&BreakIterator::next, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::current()
 *
 * Takes no arguments. Returns the value of BreakIterator::current() for
 * the underlying ICU iterator, widened to a PHP integer.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, current)
{
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_NONE();

	BREAKITER_METHOD_FETCH_OBJECT;

	RETURN_LONG((zend_long)bio->biter->current());
}
|
|
|
|
/*
 * IntlBreakIterator::following(int $offset)
 *
 * Forwards to _breakiter_int32_ret_int32() with BreakIterator::following.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, following)
{
	_breakiter_int32_ret_int32(&BreakIterator::following, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::preceding(int $offset)
 *
 * Forwards to _breakiter_int32_ret_int32() with BreakIterator::preceding.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, preceding)
{
	_breakiter_int32_ret_int32(&BreakIterator::preceding, INTERNAL_FUNCTION_PARAM_PASSTHRU);
}
|
|
|
|
/*
 * IntlBreakIterator::isBoundary(int $offset)
 *
 * Returns, as a PHP bool, the result of BreakIterator::isBoundary() for the
 * given offset. The offset must fit in an int32_t; otherwise an argument
 * value error is raised for argument 1. Here the range check runs before
 * the object fetch.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, isBoundary)
{
	zend_long offset;
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_START(1, 1)
		Z_PARAM_LONG(offset)
	ZEND_PARSE_PARAMETERS_END();

	const bool fits_int32 = (offset >= INT32_MIN) && (offset <= INT32_MAX);
	if (UNEXPECTED(!fits_int32)) {
		zend_argument_value_error(1, "must be between %d and %d", INT32_MIN, INT32_MAX);
		RETURN_THROWS();
	}

	BREAKITER_METHOD_FETCH_OBJECT;

	const UBool at_boundary = bio->biter->isBoundary((int32_t)offset);

	RETURN_BOOL(at_boundary != 0);
}
|
|
|
|
/*
 * IntlBreakIterator::getLocale(int $type)
 *
 * Returns the name of the Locale reported by BreakIterator::getLocale() for
 * the requested type. Only ULOC_ACTUAL_LOCALE and ULOC_VALID_LOCALE are
 * accepted; any other value sets U_ILLEGAL_ARGUMENT_ERROR through
 * intl_error_set() and returns false. The ICU call itself is followed by
 * INTL_METHOD_CHECK_STATUS (macro defined outside this file).
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, getLocale)
{
	zend_long locale_type;
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_START(1, 1)
		Z_PARAM_LONG(locale_type)
	ZEND_PARSE_PARAMETERS_END();

	const bool known_type = (locale_type == ULOC_ACTUAL_LOCALE)
		|| (locale_type == ULOC_VALID_LOCALE);

	/* TODO: Change to ValueError? */
	if (!known_type) {
		intl_error_set(NULL, U_ILLEGAL_ARGUMENT_ERROR, "invalid locale type");
		RETURN_FALSE;
	}

	BREAKITER_METHOD_FETCH_OBJECT;

	Locale resolved = bio->biter->getLocale(
		(ULocDataLocaleType)locale_type, BREAKITER_ERROR_CODE(bio));
	INTL_METHOD_CHECK_STATUS(bio, "Call to ICU method has failed");

	RETURN_STRING(resolved.getName());
}
|
|
|
|
/*
 * IntlBreakIterator::getPartsIterator(int $type = 0)
 *
 * Validates the key type (it must equal one of the three
 * PARTS_ITERATOR_KEY_* constants, otherwise an argument value error is
 * raised for argument 1) and then fills return_value through
 * IntlIterator_from_BreakIterator_parts(). The local defaults to 0 when the
 * argument is omitted.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, getPartsIterator)
{
	zend_long key_type = 0;
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_START(0, 1)
		Z_PARAM_OPTIONAL
		Z_PARAM_LONG(key_type)
	ZEND_PARSE_PARAMETERS_END();

	const bool known_key_type = (key_type == PARTS_ITERATOR_KEY_SEQUENTIAL)
		|| (key_type == PARTS_ITERATOR_KEY_LEFT)
		|| (key_type == PARTS_ITERATOR_KEY_RIGHT);

	if (!known_key_type) {
		zend_argument_value_error(1, "must be one of IntlPartsIterator::KEY_SEQUENTIAL, "
			"IntlPartsIterator::KEY_LEFT, or IntlPartsIterator::KEY_RIGHT");
		RETURN_THROWS();
	}

	BREAKITER_METHOD_FETCH_OBJECT;

	IntlIterator_from_BreakIterator_parts(object, return_value, (parts_iter_key_type)key_type);
}
|
|
|
|
/*
 * IntlBreakIterator::getErrorCode()
 *
 * Takes no arguments. Returns the error code stored on the object as a PHP
 * integer.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, getErrorCode)
{
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_NONE();

	/* Plain fetch instead of BREAKITER_METHOD_FETCH_OBJECT, so that the
	 * object's last error code is not reset before it is read. */
	bio = Z_INTL_BREAKITERATOR_P(object);

	const zend_long last_code = (zend_long)BREAKITER_ERROR_CODE(bio);
	RETURN_LONG(last_code);
}
|
|
|
|
/*
 * IntlBreakIterator::getErrorMessage()
 *
 * Takes no arguments. Returns the zend_string produced by
 * intl_error_get_message() for the object's error structure.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, getErrorMessage)
{
	BREAKITER_METHOD_INIT_VARS;
	object = ZEND_THIS;

	ZEND_PARSE_PARAMETERS_NONE();

	/* Plain fetch instead of BREAKITER_METHOD_FETCH_OBJECT, so that the
	 * object's last error is not reset before it is read. */
	bio = Z_INTL_BREAKITERATOR_P(object);

	/* Hand the last error message straight back to the caller. */
	RETURN_STR(intl_error_get_message(BREAKITER_ERROR_P(bio)));
}
|
|
|
|
/*
 * IntlBreakIterator::getIterator()
 *
 * Takes no arguments. Fills return_value via
 * zend_create_internal_iterator_zval() for this object.
 */
U_CFUNC PHP_METHOD(IntlBreakIterator, getIterator)
{
	ZEND_PARSE_PARAMETERS_NONE();

	zend_create_internal_iterator_zval(return_value, ZEND_THIS);
}
|