mirror of
https://github.com/php/php-src.git
synced 2025-08-16 14:08:47 +02:00

Use our own string builder instead of using libxml's and then having to copy over. For the following test: ``` $dom = Dom\HTMLDocument::createEmpty(); $root = $dom->appendChild($dom->createElement('root')); $root->append('abc', 'def', 'ghi'); $f = $root->firstChild; for ($i = 0; $i < 1000000; $i++) $f->wholeText; ``` The following results were obtained on an i7-4790: ``` Benchmark 1: ./sapi/cli/php x.php Time (mean ± σ): 57.2 ms ± 2.3 ms [User: 53.2 ms, System: 3.4 ms] Range (min … max): 54.7 ms … 69.3 ms 52 runs Benchmark 2: ./sapi/cli/php_old x.php Time (mean ± σ): 89.4 ms ± 3.4 ms [User: 85.6 ms, System: 3.0 ms] Range (min … max): 86.1 ms … 105.8 ms 32 runs Summary ./sapi/cli/php x.php ran 1.56 ± 0.09 times faster than ./sapi/cli/php_old x.php ```
174 lines
4.7 KiB
C
174 lines
4.7 KiB
C
/*
|
|
+----------------------------------------------------------------------+
|
|
| Copyright (c) The PHP Group |
|
|
+----------------------------------------------------------------------+
|
|
| This source file is subject to version 3.01 of the PHP license, |
|
|
| that is bundled with this package in the file LICENSE, and is |
|
|
| available through the world-wide-web at the following url: |
|
|
| https://www.php.net/license/3_01.txt |
|
|
| If you did not receive a copy of the PHP license and are unable to |
|
|
| obtain it through the world-wide-web, please send a note to |
|
|
| license@php.net so we can mail you a copy immediately. |
|
|
+----------------------------------------------------------------------+
|
|
| Authors: Christian Stocker <chregu@php.net> |
|
|
| Rob Richards <rrichards@php.net> |
|
|
+----------------------------------------------------------------------+
|
|
*/
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include <config.h>
|
|
#endif
|
|
|
|
#include "php.h"
|
|
#if defined(HAVE_LIBXML) && defined(HAVE_DOM)
|
|
#include "php_dom.h"
|
|
#include "dom_properties.h"
|
|
|
|
/*
|
|
* class DOMText extends DOMCharacterData
|
|
*
|
|
* URL: https://www.w3.org/TR/2003/WD-DOM-Level-3-Core-20030226/DOM3-Core.html#ID-1312295772
|
|
* Since:
|
|
*/
|
|
|
|
/* {{{ */
|
|
PHP_METHOD(DOMText, __construct)
|
|
{
|
|
xmlNodePtr nodep = NULL, oldnode = NULL;
|
|
dom_object *intern;
|
|
char *value = NULL;
|
|
size_t value_len;
|
|
|
|
if (zend_parse_parameters(ZEND_NUM_ARGS(), "|s", &value, &value_len) == FAILURE) {
|
|
RETURN_THROWS();
|
|
}
|
|
|
|
nodep = xmlNewText(BAD_CAST value);
|
|
|
|
if (!nodep) {
|
|
php_dom_throw_error(INVALID_STATE_ERR, true);
|
|
RETURN_THROWS();
|
|
}
|
|
|
|
intern = Z_DOMOBJ_P(ZEND_THIS);
|
|
oldnode = dom_object_get_node(intern);
|
|
if (oldnode != NULL) {
|
|
php_libxml_node_decrement_resource((php_libxml_node_object *)intern);
|
|
}
|
|
php_libxml_increment_node_ptr((php_libxml_node_object *)intern, nodep, (void *)intern);
|
|
}
|
|
/* }}} end DOMText::__construct */
|
|
|
|
/* {{{ wholeText string
|
|
readonly=yes
|
|
URL: http://www.w3.org/TR/2003/WD-DOM-Level-3-Core-20030226/DOM3-Core.html#core-Text3-wholeText
|
|
Since: DOM Level 3
|
|
*/
|
|
zend_result dom_text_whole_text_read(dom_object *obj, zval *retval)
|
|
{
|
|
DOM_PROP_NODE(xmlNodePtr, node, obj);
|
|
|
|
smart_str str = {0};
|
|
|
|
/* Find starting text node */
|
|
while (node->prev && ((node->prev->type == XML_TEXT_NODE) || (node->prev->type == XML_CDATA_SECTION_NODE))) {
|
|
node = node->prev;
|
|
}
|
|
|
|
/* concatenate all adjacent text and cdata nodes */
|
|
while (node && ((node->type == XML_TEXT_NODE) || (node->type == XML_CDATA_SECTION_NODE))) {
|
|
smart_str_appends(&str, (const char *) node->content);
|
|
node = node->next;
|
|
}
|
|
|
|
ZVAL_STR(retval, smart_str_extract(&str));
|
|
|
|
return SUCCESS;
|
|
}
|
|
|
|
/* }}} */
|
|
|
|
/* {{{ URL: http://www.w3.org/TR/2003/WD-DOM-Level-3-Core-20030226/DOM3-Core.html#core-ID-38853C1D
|
|
Modern spec URL: https://dom.spec.whatwg.org/#dom-text-splittext
|
|
Since:
|
|
*/
|
|
PHP_METHOD(DOMText, splitText)
|
|
{
|
|
zval *id;
|
|
xmlChar *first;
|
|
xmlChar *second;
|
|
xmlNodePtr node;
|
|
xmlNodePtr nnode;
|
|
zend_long offset;
|
|
int length;
|
|
dom_object *intern;
|
|
|
|
id = ZEND_THIS;
|
|
if (zend_parse_parameters(ZEND_NUM_ARGS(), "l", &offset) == FAILURE) {
|
|
RETURN_THROWS();
|
|
}
|
|
DOM_GET_OBJ(node, id, xmlNodePtr, intern);
|
|
|
|
if (offset < 0) {
|
|
zend_argument_value_error(1, "must be greater than or equal to 0");
|
|
RETURN_THROWS();
|
|
}
|
|
|
|
const xmlChar *cur = php_dom_get_content_or_empty(node);
|
|
length = xmlUTF8Strlen(cur);
|
|
|
|
if (ZEND_LONG_INT_OVFL(offset) || (int)offset > length) {
|
|
if (php_dom_follow_spec_intern(intern)) {
|
|
php_dom_throw_error(INDEX_SIZE_ERR, /* strict */ true);
|
|
}
|
|
RETURN_FALSE;
|
|
}
|
|
|
|
first = xmlUTF8Strndup(cur, (int)offset);
|
|
second = xmlUTF8Strsub(cur, (int)offset, (int)(length - offset));
|
|
|
|
xmlNodeSetContent(node, first);
|
|
nnode = xmlNewDocText(node->doc, second);
|
|
|
|
xmlFree(first);
|
|
xmlFree(second);
|
|
|
|
if (nnode == NULL) {
|
|
php_dom_throw_error(INVALID_STATE_ERR, /* strict */ true);
|
|
RETURN_THROWS();
|
|
}
|
|
|
|
if (node->parent != NULL) {
|
|
nnode->type = XML_ELEMENT_NODE;
|
|
xmlAddNextSibling(node, nnode);
|
|
nnode->type = XML_TEXT_NODE;
|
|
}
|
|
|
|
php_dom_create_object(nnode, return_value, intern);
|
|
}
|
|
/* }}} end dom_text_split_text */
|
|
|
|
/* {{{ URL: http://www.w3.org/TR/2003/WD-DOM-Level-3-Core-20030226/DOM3-Core.html#core-Text3-isWhitespaceInElementContent
|
|
Since: DOM Level 3
|
|
*/
|
|
PHP_METHOD(DOMText, isWhitespaceInElementContent)
|
|
{
|
|
zval *id;
|
|
xmlNodePtr node;
|
|
dom_object *intern;
|
|
|
|
id = ZEND_THIS;
|
|
if (zend_parse_parameters_none() == FAILURE) {
|
|
RETURN_THROWS();
|
|
}
|
|
DOM_GET_OBJ(node, id, xmlNodePtr, intern);
|
|
|
|
if (xmlIsBlankNode(node)) {
|
|
RETURN_TRUE;
|
|
} else {
|
|
RETURN_FALSE;
|
|
}
|
|
}
|
|
/* }}} end dom_text_is_whitespace_in_element_content */
|
|
|
|
#endif
|