root/ext/tidy/tidy.c

/* [<][>][^][v][top][bottom][index][help] */

DEFINITIONS

This source file includes following definitions.
  1. ZEND_GET_MODULE
  2. php_tidy_realloc
  3. php_tidy_free
  4. php_tidy_panic
  5. _php_tidy_set_tidy_opt
  6. php_tidy_quick_repair
  7. php_tidy_file_to_mem
  8. tidy_object_free_storage
  9. tidy_object_new
  10. tidy_object_new_node
  11. tidy_object_new_doc
  12. tidy_get_ce_node
  13. tidy_get_ce_doc
  14. tidy_instanciate
  15. tidy_doc_cast_handler
  16. tidy_node_cast_handler
  17. tidy_doc_update_properties
  18. tidy_add_default_properties
  19. php_tidy_get_opt_val
  20. php_tidy_create_node
  21. _php_tidy_apply_config_array
  22. php_tidy_parse_string
  23. PHP_MINIT_FUNCTION
  24. PHP_RINIT_FUNCTION
  25. PHP_MSHUTDOWN_FUNCTION
  26. PHP_MINFO_FUNCTION
  27. PHP_FUNCTION
  28. PHP_FUNCTION
  29. PHP_FUNCTION
  30. PHP_FUNCTION
  31. PHP_FUNCTION
  32. PHP_FUNCTION
  33. PHP_FUNCTION
  34. PHP_FUNCTION
  35. PHP_FUNCTION
  36. PHP_FUNCTION
  37. PHP_FUNCTION
  38. PHP_FUNCTION
  39. PHP_FUNCTION
  40. PHP_FUNCTION
  41. PHP_FUNCTION
  42. PHP_FUNCTION
  43. PHP_FUNCTION
  44. PHP_FUNCTION
  45. PHP_FUNCTION
  46. PHP_FUNCTION
  47. PHP_FUNCTION
  48. TIDY_DOC_METHOD
  49. TIDY_DOC_METHOD
  50. TIDY_DOC_METHOD
  51. PHP_FUNCTION
  52. PHP_FUNCTION
  53. PHP_FUNCTION
  54. PHP_FUNCTION
  55. TIDY_NODE_METHOD
  56. TIDY_NODE_METHOD
  57. TIDY_NODE_METHOD
  58. TIDY_NODE_METHOD
  59. TIDY_NODE_METHOD
  60. TIDY_NODE_METHOD
  61. TIDY_NODE_METHOD
  62. TIDY_NODE_METHOD
  63. TIDY_NODE_METHOD
  64. _php_tidy_register_nodetypes
  65. _php_tidy_register_tags

/*
  +----------------------------------------------------------------------+
  | PHP Version 5                                                        |
  +----------------------------------------------------------------------+
  | Copyright (c) 1997-2008 The PHP Group                                |
  +----------------------------------------------------------------------+
  | This source file is subject to version 3.01 of the PHP license,      |
  | that is bundled with this package in the file LICENSE, and is        |
  | available through the world-wide-web at the following url:           |
  | http://www.php.net/license/3_01.txt                                  |
  | If you did not receive a copy of the PHP license and are unable to   |
  | obtain it through the world-wide-web, please send a note to          |
  | license@php.net so we can mail you a copy immediately.               |
  +----------------------------------------------------------------------+
  | Author: John Coggeshall <john@php.net>                               |
  +----------------------------------------------------------------------+
*/

/* $Id: tidy.c,v 1.66.2.8.2.25 2007/12/31 07:20:14 sebastian Exp $ */

#ifdef HAVE_CONFIG_H
#include "config.h"
#endif

#include "php.h"
#include "php_tidy.h"

#if HAVE_TIDY

#include "php_ini.h"
#include "ext/standard/info.h"
#include "safe_mode.h"

#include "tidy.h"
#include "buffio.h"

/* compatibility with older versions of libtidy */
#ifndef TIDY_CALL
#define TIDY_CALL
#endif

#define PHP_TIDY_MODULE_VERSION "2.0"

/* {{{ ext/tidy macros
*/
#define TIDY_SET_CONTEXT \
    zval *object = getThis();

#define TIDY_FETCH_OBJECT       \
        PHPTidyObj *obj;        \
        TIDY_SET_CONTEXT; \
        if (object) {   \
                if (ZEND_NUM_ARGS()) {  \
                        WRONG_PARAM_COUNT;      \
                }       \
        } else {        \
                if (zend_parse_method_parameters(ZEND_NUM_ARGS() TSRMLS_CC, NULL, "O", &object, tidy_ce_doc) == FAILURE) {      \
                        RETURN_FALSE;   \
                }       \
        }       \
        obj = (PHPTidyObj *) zend_object_store_get_object(object TSRMLS_CC);    \

#define TIDY_FETCH_ONLY_OBJECT  \
        PHPTidyObj *obj;        \
        TIDY_SET_CONTEXT; \
        if (ZEND_NUM_ARGS()) {  \
                WRONG_PARAM_COUNT;      \
        }       \
        obj = (PHPTidyObj *) zend_object_store_get_object(object TSRMLS_CC);    \

#define TIDY_APPLY_CONFIG_ZVAL(_doc, _val) \
    if(_val) { \
        if(Z_TYPE_PP(_val) == IS_ARRAY) { \
            _php_tidy_apply_config_array(_doc, HASH_OF(*_val) TSRMLS_CC); \
        } else { \
            convert_to_string_ex(_val); \
            TIDY_SAFE_MODE_CHECK(Z_STRVAL_PP(_val)); \
            switch (tidyLoadConfig(_doc, Z_STRVAL_PP(_val))) { \
              case -1: \
                php_error_docref(NULL TSRMLS_CC, E_WARNING, "Could not load configuration file '%s'", Z_STRVAL_PP(_val)); \
                break; \
              case 1: \
                php_error_docref(NULL TSRMLS_CC, E_NOTICE, "There were errors while parsing the configuration file '%s'", Z_STRVAL_PP(_val)); \
                break; \
            } \
        } \
    }

#define REGISTER_TIDY_CLASS(classname, name, parent, __flags) \
        { \
                zend_class_entry ce; \
                INIT_CLASS_ENTRY(ce, # classname, tidy_funcs_ ## name); \
                ce.create_object = tidy_object_new_ ## name; \
                tidy_ce_ ## name = zend_register_internal_class_ex(&ce, parent, NULL TSRMLS_CC); \
                tidy_ce_ ## name->ce_flags |= __flags;  \
                memcpy(&tidy_object_handlers_ ## name, zend_get_std_object_handlers(), sizeof(zend_object_handlers)); \
                tidy_object_handlers_ ## name.clone_obj = NULL; \
        }

#define TIDY_TAG_CONST(tag) REGISTER_LONG_CONSTANT("TIDY_TAG_" #tag, TidyTag_##tag, CONST_CS | CONST_PERSISTENT)
#define TIDY_NODE_CONST(name, type) REGISTER_LONG_CONSTANT("TIDY_NODETYPE_" #name, TidyNode_##type, CONST_CS | CONST_PERSISTENT)

#ifndef TRUE
#define TRUE 1
#endif

#ifndef FALSE
#define FALSE 0
#endif

#define ADD_PROPERTY_STRING(_table, _key, _string) \
        { \
                zval *tmp; \
                MAKE_STD_ZVAL(tmp); \
                if (_string) { \
                        ZVAL_STRING(tmp, (char *)_string, 1); \
                } else { \
                        ZVAL_EMPTY_STRING(tmp); \
                } \
                zend_hash_update(_table, #_key, sizeof(#_key), (void *)&tmp, sizeof(zval *), NULL); \
        }

#define ADD_PROPERTY_STRINGL(_table, _key, _string, _len) \
   { \
       zval *tmp; \
       MAKE_STD_ZVAL(tmp); \
       if (_string) { \
           ZVAL_STRINGL(tmp, (char *)_string, _len, 1); \
       } else { \
           ZVAL_EMPTY_STRING(tmp); \
       } \
       zend_hash_update(_table, #_key, sizeof(#_key), (void *)&tmp, sizeof(zval *), NULL); \
   }

#define ADD_PROPERTY_LONG(_table, _key, _long) \
        { \
                zval *tmp; \
                MAKE_STD_ZVAL(tmp); \
                ZVAL_LONG(tmp, _long); \
                zend_hash_update(_table, #_key, sizeof(#_key), (void *)&tmp, sizeof(zval *), NULL); \
        }

#define ADD_PROPERTY_NULL(_table, _key) \
        { \
                zval *tmp; \
                MAKE_STD_ZVAL(tmp); \
                ZVAL_NULL(tmp); \
                zend_hash_update(_table, #_key, sizeof(#_key), (void *)&tmp, sizeof(zval *), NULL); \
        }

#define ADD_PROPERTY_BOOL(_table, _key, _bool) \
    { \
       zval *tmp; \
       MAKE_STD_ZVAL(tmp); \
       ZVAL_BOOL(tmp, _bool); \
       zend_hash_update(_table, #_key, sizeof(#_key), (void *)&tmp, sizeof(zval *), NULL); \
   }

#define TIDY_SAFE_MODE_CHECK(filename) \
if ((PG(safe_mode) && (!php_checkuid(filename, NULL, CHECKUID_CHECK_FILE_AND_DIR))) || php_check_open_basedir(filename TSRMLS_CC)) { \
        RETURN_FALSE; \
} \

#define TIDY_SET_DEFAULT_CONFIG(_doc) \
        if (TG(default_config) && TG(default_config)[0]) { \
                if (tidyLoadConfig(_doc, TG(default_config)) < 0) { \
                        php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unable to load Tidy configuration file at '%s'.", TG(default_config)); \
                } \
        }
/* }}} */

/* {{{ ext/tidy structs 
*/
typedef struct _PHPTidyDoc PHPTidyDoc;
typedef struct _PHPTidyObj PHPTidyObj;

typedef enum {
        is_node,
        is_doc
} tidy_obj_type;

typedef enum {
        is_root_node,
        is_html_node,
        is_head_node,
        is_body_node
} tidy_base_nodetypes;

struct _PHPTidyDoc {
        TidyDoc     doc;
        TidyBuffer  *errbuf;
        unsigned int ref_count;
};

struct _PHPTidyObj {
        zend_object         std;
        TidyNode            node;
        tidy_obj_type       type;
        PHPTidyDoc          *ptdoc;
};
/* }}} */

/* {{{ ext/tidy prototypes
*/
static char *php_tidy_file_to_mem(char *, zend_bool, int * TSRMLS_DC);
static void tidy_object_free_storage(void * TSRMLS_DC);
static zend_object_value tidy_object_new_node(zend_class_entry * TSRMLS_DC);
static zend_object_value tidy_object_new_doc(zend_class_entry * TSRMLS_DC);
static zend_class_entry *tidy_get_ce_node(zval * TSRMLS_DC);
static zend_class_entry *tidy_get_ce_doc(zval * TSRMLS_DC);
static zval * tidy_instanciate(zend_class_entry *, zval * TSRMLS_DC);
static int tidy_doc_cast_handler(zval *, zval *, int TSRMLS_DC);
static int tidy_node_cast_handler(zval *, zval *, int TSRMLS_DC);
static void tidy_doc_update_properties(PHPTidyObj * TSRMLS_DC);
static void tidy_add_default_properties(PHPTidyObj *, tidy_obj_type TSRMLS_DC);
static void *php_tidy_get_opt_val(PHPTidyDoc *, TidyOption, TidyOptionType * TSRMLS_DC);
static void php_tidy_create_node(INTERNAL_FUNCTION_PARAMETERS, tidy_base_nodetypes);
static int _php_tidy_set_tidy_opt(TidyDoc, char *, zval * TSRMLS_DC);
static int _php_tidy_apply_config_array(TidyDoc doc, HashTable *ht_options TSRMLS_DC);
static void _php_tidy_register_nodetypes(INIT_FUNC_ARGS);
static void _php_tidy_register_tags(INIT_FUNC_ARGS);

static PHP_MINIT_FUNCTION(tidy);
static PHP_MSHUTDOWN_FUNCTION(tidy);
static PHP_RINIT_FUNCTION(tidy);
static PHP_MINFO_FUNCTION(tidy);

static PHP_FUNCTION(tidy_getopt);
static PHP_FUNCTION(tidy_parse_string);
static PHP_FUNCTION(tidy_parse_file);
static PHP_FUNCTION(tidy_clean_repair);
static PHP_FUNCTION(tidy_repair_string);
static PHP_FUNCTION(tidy_repair_file);
static PHP_FUNCTION(tidy_diagnose);
static PHP_FUNCTION(tidy_get_output);
static PHP_FUNCTION(tidy_get_error_buffer);
static PHP_FUNCTION(tidy_get_release);
static PHP_FUNCTION(tidy_get_config);
static PHP_FUNCTION(tidy_get_status);
static PHP_FUNCTION(tidy_get_html_ver);
#if HAVE_TIDYOPTGETDOC
static PHP_FUNCTION(tidy_get_opt_doc);
#endif
static PHP_FUNCTION(tidy_is_xhtml);
static PHP_FUNCTION(tidy_is_xml);
static PHP_FUNCTION(tidy_error_count);
static PHP_FUNCTION(tidy_warning_count);
static PHP_FUNCTION(tidy_access_count);
static PHP_FUNCTION(tidy_config_count);

static PHP_FUNCTION(ob_tidyhandler);

static PHP_FUNCTION(tidy_get_root);
static PHP_FUNCTION(tidy_get_html);
static PHP_FUNCTION(tidy_get_head);
static PHP_FUNCTION(tidy_get_body);

static TIDY_DOC_METHOD(__construct);
static TIDY_DOC_METHOD(parseFile);
static TIDY_DOC_METHOD(parseString);

static TIDY_NODE_METHOD(hasChildren);
static TIDY_NODE_METHOD(hasSiblings);
static TIDY_NODE_METHOD(isComment);
static TIDY_NODE_METHOD(isHtml);
static TIDY_NODE_METHOD(isText);
static TIDY_NODE_METHOD(isJste);
static TIDY_NODE_METHOD(isAsp);
static TIDY_NODE_METHOD(isPhp);
static TIDY_NODE_METHOD(getParent);
/* }}} */

ZEND_DECLARE_MODULE_GLOBALS(tidy)

PHP_INI_BEGIN()
STD_PHP_INI_ENTRY("tidy.default_config",        "",     PHP_INI_SYSTEM,         OnUpdateString,         default_config,         zend_tidy_globals,      tidy_globals)
PHP_INI_ENTRY("tidy.clean_output",     "0",    PHP_INI_PERDIR,         NULL)
PHP_INI_END()

static zend_function_entry tidy_functions[] = {
        PHP_FE(tidy_getopt,             NULL)
        PHP_FE(tidy_parse_string,       NULL)
        PHP_FE(tidy_parse_file,         NULL)
        PHP_FE(tidy_get_output,         NULL)
        PHP_FE(tidy_get_error_buffer,   NULL) 
        PHP_FE(tidy_clean_repair,       NULL)
        PHP_FE(tidy_repair_string,      NULL)
        PHP_FE(tidy_repair_file,        NULL)
        PHP_FE(tidy_diagnose,           NULL)
        PHP_FE(tidy_get_release,        NULL)
        PHP_FE(tidy_get_config,         NULL)
        PHP_FE(tidy_get_status,         NULL)
        PHP_FE(tidy_get_html_ver,       NULL)
        PHP_FE(tidy_is_xhtml,           NULL)
        PHP_FE(tidy_is_xml,             NULL)
        PHP_FE(tidy_error_count,        NULL)
        PHP_FE(tidy_warning_count,      NULL)
        PHP_FE(tidy_access_count,       NULL)
        PHP_FE(tidy_config_count,       NULL) 
#if HAVE_TIDYOPTGETDOC
        PHP_FE(tidy_get_opt_doc,        NULL)
#endif
        PHP_FE(tidy_get_root,           NULL)
        PHP_FE(tidy_get_head,           NULL)
        PHP_FE(tidy_get_html,           NULL)
        PHP_FE(tidy_get_body,           NULL)
        PHP_FE(ob_tidyhandler,          NULL)
        {NULL, NULL, NULL}
};

static zend_function_entry tidy_funcs_doc[] = {
        TIDY_METHOD_MAP(getOpt, tidy_getopt, NULL)
        TIDY_METHOD_MAP(cleanRepair, tidy_clean_repair, NULL)
        TIDY_DOC_ME(parseFile, NULL)
        TIDY_DOC_ME(parseString, NULL)
        TIDY_METHOD_MAP(repairString, tidy_repair_string, NULL)
        TIDY_METHOD_MAP(repairFile, tidy_repair_file, NULL)
        TIDY_METHOD_MAP(diagnose, tidy_diagnose, NULL)
        TIDY_METHOD_MAP(getRelease, tidy_get_release, NULL)
        TIDY_METHOD_MAP(getConfig, tidy_get_config, NULL)
        TIDY_METHOD_MAP(getStatus, tidy_get_status, NULL)
        TIDY_METHOD_MAP(getHtmlVer, tidy_get_html_ver, NULL)
#if HAVE_TIDYOPTGETDOC
        TIDY_METHOD_MAP(getOptDoc, tidy_get_opt_doc, NULL)
#endif
        TIDY_METHOD_MAP(isXhtml, tidy_is_xhtml, NULL)
        TIDY_METHOD_MAP(isXml, tidy_is_xml, NULL)
        TIDY_METHOD_MAP(root, tidy_get_root, NULL)
        TIDY_METHOD_MAP(head, tidy_get_head, NULL)
        TIDY_METHOD_MAP(html, tidy_get_html, NULL)
        TIDY_METHOD_MAP(body, tidy_get_body, NULL)
        TIDY_DOC_ME(__construct, NULL)
        {NULL, NULL, NULL}
};

static zend_function_entry tidy_funcs_node[] = {
        TIDY_NODE_ME(hasChildren, NULL)
        TIDY_NODE_ME(hasSiblings, NULL)
        TIDY_NODE_ME(isComment, NULL)
        TIDY_NODE_ME(isHtml, NULL)
        TIDY_NODE_ME(isText, NULL)
        TIDY_NODE_ME(isJste, NULL)
        TIDY_NODE_ME(isAsp, NULL)
        TIDY_NODE_ME(isPhp, NULL)
        TIDY_NODE_ME(getParent, NULL)
        {NULL, NULL, NULL}
};

static zend_class_entry *tidy_ce_doc, *tidy_ce_node;

static zend_object_handlers tidy_object_handlers_doc;
static zend_object_handlers tidy_object_handlers_node;

zend_module_entry tidy_module_entry = {
        STANDARD_MODULE_HEADER,
        "tidy",
        tidy_functions,
        PHP_MINIT(tidy),
        PHP_MSHUTDOWN(tidy),
        PHP_RINIT(tidy),
        NULL,
        PHP_MINFO(tidy),
        PHP_TIDY_MODULE_VERSION,
        PHP_MODULE_GLOBALS(tidy),
        NULL,
        NULL,
        NULL,
        STANDARD_MODULE_PROPERTIES_EX
};

#ifdef COMPILE_DL_TIDY
ZEND_GET_MODULE(tidy)
#endif

static void* TIDY_CALL php_tidy_malloc(size_t len)
{
        return emalloc(len);
}

static void* TIDY_CALL php_tidy_realloc(void *buf, size_t len)
{
        return erealloc(buf, len);
}

static void TIDY_CALL php_tidy_free(void *buf)
{
        efree(buf);
}

static void TIDY_CALL php_tidy_panic(ctmbstr msg)
{
        TSRMLS_FETCH();
        php_error_docref(NULL TSRMLS_CC, E_ERROR, "Could not allocate memory for tidy! (Reason: %s)", (char *)msg);
}

static int _php_tidy_set_tidy_opt(TidyDoc doc, char *optname, zval *value TSRMLS_DC)
{
        TidyOption opt = tidyGetOptionByName(doc, optname);
        zval conv = *value;

        if (!opt) {
                php_error_docref(NULL TSRMLS_CC, E_NOTICE, "Unknown Tidy Configuration Option '%s'", optname);
                return FAILURE;
        }
        
        if (tidyOptIsReadOnly(opt)) {
                php_error_docref(NULL TSRMLS_CC, E_NOTICE, "Attempting to set read-only option '%s'", optname);
                return FAILURE;
        }

        switch(tidyOptGetType(opt)) {
                case TidyString:
                        if (Z_TYPE(conv) != IS_STRING) {
                                zval_copy_ctor(&conv);
                                convert_to_string(&conv);
                        }
                        if (tidyOptSetValue(doc, tidyOptGetId(opt), Z_STRVAL(conv))) {
                                if (Z_TYPE(conv) != Z_TYPE_P(value)) {
                                        zval_dtor(&conv);
                                }
                                return SUCCESS;
                        }
                        if (Z_TYPE(conv) != Z_TYPE_P(value)) {
                                zval_dtor(&conv);
                        }
                        break;

                case TidyInteger:
                        if (Z_TYPE(conv) != IS_LONG) {
                                zval_copy_ctor(&conv);
                                convert_to_long(&conv);
                        }
                        if (tidyOptSetInt(doc, tidyOptGetId(opt), Z_LVAL(conv))) {
                                return SUCCESS;
                        }
                        break;

                case TidyBoolean:
                        if (Z_TYPE(conv) != IS_LONG) {
                                zval_copy_ctor(&conv);
                                convert_to_long(&conv);
                        }
                        if (tidyOptSetBool(doc, tidyOptGetId(opt), Z_LVAL(conv))) {
                                return SUCCESS;
                        }
                        break;

                default:
                        php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unable to determine type of configuration option");
                        break;
        }       

        return FAILURE;
}

static void php_tidy_quick_repair(INTERNAL_FUNCTION_PARAMETERS, zend_bool is_file)
{
        char *data=NULL, *arg1, *enc = NULL;
        int arg1_len, enc_len = 0, data_len = 0;
        zend_bool use_include_path = 0;
        TidyDoc doc;
        TidyBuffer *errbuf;
        zval **config;

        if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s|Zsb", &arg1, &arg1_len, &config, &enc, &enc_len, &use_include_path) == FAILURE) {
                RETURN_FALSE;
        }
        
        if (is_file) {
                if (!(data = php_tidy_file_to_mem(arg1, use_include_path, &data_len TSRMLS_CC))) {
                        RETURN_FALSE;
                }
        } else {
                data = arg1;
                data_len = arg1_len;
        }

        doc = tidyCreate();
        errbuf = emalloc(sizeof(TidyBuffer));
        tidyBufInit(errbuf);
        
        if (tidySetErrorBuffer(doc, errbuf) != 0) {
                tidyBufFree(errbuf);
                efree(errbuf);
                tidyRelease(doc);
                php_error_docref(NULL TSRMLS_CC, E_ERROR, "Could not set Tidy error buffer");
        }
        
        tidyOptSetBool(doc, TidyForceOutput, yes);
        tidyOptSetBool(doc, TidyMark, no);
        
        TIDY_SET_DEFAULT_CONFIG(doc);
        
        if (ZEND_NUM_ARGS() > 1) {
                TIDY_APPLY_CONFIG_ZVAL(doc, config);
        }

        if(enc_len) {
                if (tidySetCharEncoding(doc, enc) < 0) {
                        php_error_docref(NULL TSRMLS_CC, E_WARNING, "Could not set encoding '%s'", enc);
                        RETVAL_FALSE;
                }
        }
        
        if (data) {
                TidyBuffer buf;

                tidyBufInit(&buf);
                tidyBufAppend(&buf, data, data_len);

                if (tidyParseBuffer(doc, &buf) < 0) {
                        php_error_docref(NULL TSRMLS_CC, E_WARNING, "%s", errbuf->bp);
                        RETVAL_FALSE;
                } else {
                        if (tidyCleanAndRepair(doc) >= 0) {
                                TidyBuffer output;
                                tidyBufInit(&output);

                                tidySaveBuffer (doc, &output);
                                RETVAL_STRINGL((char*)output.bp, output.size ? output.size-1 : 0, 1);
                                tidyBufFree(&output);
                        } else {
                                RETVAL_FALSE;
                        }
                }
                
                tidyBufFree(&buf);
        }

        if (is_file) {
                efree(data);
        }
        
        tidyBufFree(errbuf);
        efree(errbuf);
        tidyRelease(doc);
}

static char *php_tidy_file_to_mem(char *filename, zend_bool use_include_path, int *len TSRMLS_DC)
{
        php_stream *stream;
        char *data = NULL;

        if (!(stream = php_stream_open_wrapper(filename, "rb", (use_include_path ? USE_PATH : 0) | ENFORCE_SAFE_MODE, NULL))) {
                return NULL;
        }
        if ((*len = (int) php_stream_copy_to_mem(stream, &data, PHP_STREAM_COPY_ALL, 0)) == 0) {
                data = estrdup("");
                *len = 0;
        }
        php_stream_close(stream);

        return data;
}

static void tidy_object_free_storage(void *object TSRMLS_DC)
{
        PHPTidyObj *intern = (PHPTidyObj *)object;

        zend_object_std_dtor(&intern->std TSRMLS_CC);

        if (intern->ptdoc) {
                intern->ptdoc->ref_count--;

                if (intern->ptdoc->ref_count <= 0) {
                        tidyBufFree(intern->ptdoc->errbuf);
                        efree(intern->ptdoc->errbuf);
                        tidyRelease(intern->ptdoc->doc);
                        efree(intern->ptdoc);
                }
        }

        efree(object);
}

static void tidy_object_new(zend_class_entry *class_type, zend_object_handlers *handlers,
                                                        zend_object_value *retval, tidy_obj_type objtype TSRMLS_DC)
{
        PHPTidyObj *intern;
        zval *tmp;

        intern = emalloc(sizeof(PHPTidyObj));
        memset(intern, 0, sizeof(PHPTidyObj));
        zend_object_std_init(&intern->std, class_type TSRMLS_CC);
        
        zend_hash_copy(intern->std.properties, &class_type->default_properties, (copy_ctor_func_t) zval_add_ref, (void *) &tmp, sizeof(zval *));

        switch(objtype) {
                case is_node:
                        break;

                case is_doc:
                        tidySetMallocCall(php_tidy_malloc);
                        tidySetReallocCall(php_tidy_realloc);
                        tidySetFreeCall(php_tidy_free);
                        tidySetPanicCall(php_tidy_panic);

                        intern->ptdoc = emalloc(sizeof(PHPTidyDoc));
                        intern->ptdoc->doc = tidyCreate();
                        intern->ptdoc->ref_count = 1;
                        intern->ptdoc->errbuf = emalloc(sizeof(TidyBuffer));
                        tidyBufInit(intern->ptdoc->errbuf);

                        if (tidySetErrorBuffer(intern->ptdoc->doc, intern->ptdoc->errbuf) != 0) {
                                tidyBufFree(intern->ptdoc->errbuf);
                                efree(intern->ptdoc->errbuf);
                                tidyRelease(intern->ptdoc->doc);
                                efree(intern->ptdoc);
                                efree(intern);
                                php_error_docref(NULL TSRMLS_CC, E_ERROR, "Could not set Tidy error buffer");
                        }

                        tidyOptSetBool(intern->ptdoc->doc, TidyForceOutput, yes);
                        tidyOptSetBool(intern->ptdoc->doc, TidyMark, no);

                        TIDY_SET_DEFAULT_CONFIG(intern->ptdoc->doc);

                        tidy_add_default_properties(intern, is_doc TSRMLS_CC);
                        break;

                default:
                        break;
        }

        retval->handle = zend_objects_store_put(intern, (zend_objects_store_dtor_t)zend_objects_destroy_object, (zend_objects_free_object_storage_t) tidy_object_free_storage, NULL TSRMLS_CC);
        retval->handlers = handlers;
}

static zend_object_value tidy_object_new_node(zend_class_entry *class_type TSRMLS_DC)
{
        zend_object_value retval;
        tidy_object_new(class_type, &tidy_object_handlers_node, &retval, is_node TSRMLS_CC);
        return retval;
}

static zend_object_value tidy_object_new_doc(zend_class_entry *class_type TSRMLS_DC)
{
        zend_object_value retval;
        tidy_object_new(class_type, &tidy_object_handlers_doc, &retval, is_doc TSRMLS_CC);
        return retval;
}

static zend_class_entry *tidy_get_ce_node(zval *object TSRMLS_DC)
{
        return tidy_ce_node;
}

static zend_class_entry *tidy_get_ce_doc(zval *object TSRMLS_DC)
{
        return tidy_ce_doc;
}

static zval * tidy_instanciate(zend_class_entry *pce, zval *object TSRMLS_DC)
{
        if (!object) {
                ALLOC_ZVAL(object);
        }

        Z_TYPE_P(object) = IS_OBJECT;
        object_init_ex(object, pce);
        object->refcount = 1;
        object->is_ref = 1;
        return object;
}

static int tidy_doc_cast_handler(zval *in, zval *out, int type TSRMLS_DC)
{
        TidyBuffer output;
        PHPTidyObj *obj;

        switch(type) {
                case IS_LONG:
                        ZVAL_LONG(out, 0);
                        break;

                case IS_DOUBLE:
                        ZVAL_DOUBLE(out, 0);
                        break;

                case IS_BOOL:
                        ZVAL_BOOL(out, TRUE);
                        break;

                case IS_STRING:
                        obj = (PHPTidyObj *)zend_object_store_get_object(in TSRMLS_CC);
                        tidyBufInit(&output);
                        tidySaveBuffer (obj->ptdoc->doc, &output);
                        ZVAL_STRINGL(out, (char*)output.bp, output.size ? output.size-1 : 0, TRUE);
                        tidyBufFree(&output);
                        break;

                default:
                        return FAILURE;
        }

        return SUCCESS;
}

static int tidy_node_cast_handler(zval *in, zval *out, int type TSRMLS_DC)
{
        TidyBuffer buf;
        PHPTidyObj *obj;

        switch(type) {
                case IS_LONG:
                        ZVAL_LONG(out, 0);
                        break;

                case IS_DOUBLE:
                        ZVAL_DOUBLE(out, 0);
                        break;

                case IS_BOOL:
                        ZVAL_BOOL(out, TRUE);
                        break;

                case IS_STRING:
                        obj = (PHPTidyObj *)zend_object_store_get_object(in TSRMLS_CC);
                        tidyBufInit(&buf);
                        if (obj->ptdoc) {
                                tidyNodeGetText(obj->ptdoc->doc, obj->node, &buf);
                        }
                        ZVAL_STRINGL(out, (char*)buf.bp, buf.size ? buf.size-1 : 0, TRUE);
                        tidyBufFree(&buf);
                        break;

                default:
                        return FAILURE;
        }

        return SUCCESS;
}

static void tidy_doc_update_properties(PHPTidyObj *obj TSRMLS_DC)
{

        TidyBuffer output;
        zval *temp;

        tidyBufInit(&output);
        tidySaveBuffer (obj->ptdoc->doc, &output);
        
        if (output.size) {
                MAKE_STD_ZVAL(temp);
                ZVAL_STRINGL(temp, (char*)output.bp, output.size-1, TRUE);
                zend_hash_update(obj->std.properties, "value", sizeof("value"), (void *)&temp, sizeof(zval *), NULL);
        }
        
        tidyBufFree(&output);

        if (obj->ptdoc->errbuf->size) {
                MAKE_STD_ZVAL(temp);
                ZVAL_STRINGL(temp, (char*)obj->ptdoc->errbuf->bp, obj->ptdoc->errbuf->size-1, TRUE);
                zend_hash_update(obj->std.properties, "errorBuffer", sizeof("errorBuffer"), (void *)&temp, sizeof(zval *), NULL);
        }
}

static void tidy_add_default_properties(PHPTidyObj *obj, tidy_obj_type type TSRMLS_DC)
{

        TidyBuffer buf;
        TidyAttr        tempattr;
        TidyNode        tempnode;
        zval *attribute, *children, *temp;
        PHPTidyObj *newobj;

        switch(type) {

                case is_node:
                        tidyBufInit(&buf);
                        tidyNodeGetText(obj->ptdoc->doc, obj->node, &buf);
                        ADD_PROPERTY_STRINGL(obj->std.properties, value, buf.bp, buf.size-1);
                        tidyBufFree(&buf);

                        ADD_PROPERTY_STRING(obj->std.properties, name, tidyNodeGetName(obj->node));
                        ADD_PROPERTY_LONG(obj->std.properties, type, tidyNodeGetType(obj->node));
                        ADD_PROPERTY_LONG(obj->std.properties, line, tidyNodeLine(obj->node));
                        ADD_PROPERTY_LONG(obj->std.properties, column, tidyNodeColumn(obj->node));
                        ADD_PROPERTY_BOOL(obj->std.properties, proprietary, tidyNodeIsProp(obj->ptdoc->doc, obj->node));

                        switch(tidyNodeGetType(obj->node)) {
                                case TidyNode_Root:
                                case TidyNode_DocType:
                                case TidyNode_Text:
                                case TidyNode_Comment:
                                        break;
        
                                default:
                                        ADD_PROPERTY_LONG(obj->std.properties, id, tidyNodeGetId(obj->node));
                        }

                        tempattr = tidyAttrFirst(obj->node);
                        MAKE_STD_ZVAL(attribute);

                        if (tempattr) {
                                char *name, *val;
                                array_init(attribute);

                                do {
                                        name = (char *)tidyAttrName(tempattr);
                                        val = (char *)tidyAttrValue(tempattr);
                                        if (name && val) {
                                                add_assoc_string(attribute, name, val, TRUE);
                                        }
                                } while((tempattr = tidyAttrNext(tempattr)));
                        } else {
                                ZVAL_NULL(attribute);
                        }
                        zend_hash_update(obj->std.properties, "attribute", sizeof("attribute"), (void *)&attribute, sizeof(zval *), NULL);

                        tempnode = tidyGetChild(obj->node);

                        MAKE_STD_ZVAL(children);
                        if (tempnode) {
                                array_init(children);
                                do {
                                        MAKE_STD_ZVAL(temp);
                                        tidy_instanciate(tidy_ce_node, temp TSRMLS_CC);
                                        newobj = (PHPTidyObj *) zend_object_store_get_object(temp TSRMLS_CC);
                                        newobj->node = tempnode;
                                        newobj->type = is_node;
                                        newobj->ptdoc = obj->ptdoc;
                                        newobj->ptdoc->ref_count++;

                                        tidy_add_default_properties(newobj, is_node TSRMLS_CC);
                                        add_next_index_zval(children, temp);

                                } while((tempnode = tidyGetNext(tempnode)));

                        } else {
                                ZVAL_NULL(children);
                        }

                        zend_hash_update(obj->std.properties, "child", sizeof("child"), (void *)&children, sizeof(zval *), NULL);

                        break;

                case is_doc:
                        ADD_PROPERTY_NULL(obj->std.properties, errorBuffer);
                        ADD_PROPERTY_NULL(obj->std.properties, value);
                        break;
        }
}

static void *php_tidy_get_opt_val(PHPTidyDoc *ptdoc, TidyOption opt, TidyOptionType *type TSRMLS_DC)
{
        *type = tidyOptGetType(opt);

        switch (*type) {
                case TidyString: {
                        char *val = (char *) tidyOptGetValue(ptdoc->doc, tidyOptGetId(opt));
                        if (val) {
                                return (void *) estrdup(val);
                        } else {
                                return (void *) estrdup("");
                        }
                }
                        break;

                case TidyInteger:
                        return (void *) tidyOptGetInt(ptdoc->doc, tidyOptGetId(opt));
                        break;

                case TidyBoolean:
                        return (void *) tidyOptGetBool(ptdoc->doc, tidyOptGetId(opt));
                        break;
        }

        /* should not happen */
        return NULL;
}

static void php_tidy_create_node(INTERNAL_FUNCTION_PARAMETERS, tidy_base_nodetypes node_type)
{
        PHPTidyObj *newobj;
        TidyNode node;
        TIDY_FETCH_OBJECT;

        switch (node_type) {
                case is_root_node:
                        node = tidyGetRoot(obj->ptdoc->doc);
                        break;

                case is_html_node:
                        node = tidyGetHtml(obj->ptdoc->doc);
                        break;

                case is_head_node:
                        node = tidyGetHead(obj->ptdoc->doc);
                        break;

                case is_body_node:
                        node = tidyGetBody(obj->ptdoc->doc);
                        break;
        }

        if (!node) {
                RETURN_NULL();
        }

        tidy_instanciate(tidy_ce_node, return_value TSRMLS_CC);
        newobj = (PHPTidyObj *) zend_object_store_get_object(return_value TSRMLS_CC);
        newobj->type  = is_node;
        newobj->ptdoc = obj->ptdoc;
        newobj->node  = node;
        newobj->ptdoc->ref_count++;

        tidy_add_default_properties(newobj, is_node TSRMLS_CC);
}

static int _php_tidy_apply_config_array(TidyDoc doc, HashTable *ht_options TSRMLS_DC)
{
        char *opt_name = NULL;
        zval **opt_val;
        ulong opt_indx;
        
        for (zend_hash_internal_pointer_reset(ht_options);
                 zend_hash_get_current_data(ht_options, (void **)&opt_val) == SUCCESS;
                 zend_hash_move_forward(ht_options)) {
                
                if(zend_hash_get_current_key(ht_options, &opt_name, &opt_indx, FALSE) == FAILURE) {
                        php_error_docref(NULL TSRMLS_CC, E_ERROR, "Could not retrieve key from option array");
                        return FAILURE;
                }

                if(opt_name) {
                        _php_tidy_set_tidy_opt(doc, opt_name, *opt_val TSRMLS_CC);
                        opt_name = NULL;
                }
                                        
        }
        
        return SUCCESS;
}

static int php_tidy_parse_string(PHPTidyObj *obj, char *string, int len, char *enc TSRMLS_DC)
{
        TidyBuffer buf;
        
        if(enc) {
                if (tidySetCharEncoding(obj->ptdoc->doc, enc) < 0) {
                        php_error_docref(NULL TSRMLS_CC, E_WARNING, "Could not set encoding '%s'", enc);
                        return FAILURE;
                }
        }
        
        tidyBufInit(&buf);
        tidyBufAppend(&buf, string, len);
        if (tidyParseBuffer(obj->ptdoc->doc, &buf) < 0) {
                tidyBufFree(&buf);
                php_error_docref(NULL TSRMLS_CC, E_WARNING, "%s", obj->ptdoc->errbuf->bp);
                return FAILURE;
        
        }
        tidyBufFree(&buf);
        tidy_doc_update_properties(obj TSRMLS_CC);

        return SUCCESS;
}

static PHP_MINIT_FUNCTION(tidy)
{
        REGISTER_INI_ENTRIES();
        REGISTER_TIDY_CLASS(tidy, doc,  NULL, 0);
        REGISTER_TIDY_CLASS(tidyNode, node,     NULL, ZEND_ACC_FINAL_CLASS);

        tidy_object_handlers_doc.get_class_entry = tidy_get_ce_doc;
        tidy_object_handlers_node.get_class_entry = tidy_get_ce_node;
        
        tidy_object_handlers_doc.cast_object = tidy_doc_cast_handler;
        tidy_object_handlers_node.cast_object = tidy_node_cast_handler;

        _php_tidy_register_tags(INIT_FUNC_ARGS_PASSTHRU);
        _php_tidy_register_nodetypes(INIT_FUNC_ARGS_PASSTHRU);

        return SUCCESS;
}

static PHP_RINIT_FUNCTION(tidy)
{
        if (INI_BOOL("tidy.clean_output") == TRUE) {
                if (php_start_ob_buffer_named("ob_tidyhandler", 0, 1 TSRMLS_CC) == FAILURE) {
                        zend_error(E_NOTICE, "Failure installing Tidy output buffering.");
                }
        }

        return SUCCESS;
}

static PHP_MSHUTDOWN_FUNCTION(tidy)
{
        UNREGISTER_INI_ENTRIES();
        return SUCCESS;
}

static PHP_MINFO_FUNCTION(tidy)
{
        php_info_print_table_start();
        php_info_print_table_header(2, "Tidy support", "enabled");
        php_info_print_table_row(2, "libTidy Release", (char *)tidyReleaseDate());
        php_info_print_table_row(2, "Extension Version", PHP_TIDY_MODULE_VERSION " ($Id: tidy.c,v 1.66.2.8.2.25 2007/12/31 07:20:14 sebastian Exp $)");
        php_info_print_table_end();

        DISPLAY_INI_ENTRIES();
}

static PHP_FUNCTION(ob_tidyhandler)
{
        char *input;
        int input_len;
        long mode;
        TidyBuffer errbuf;
        TidyDoc doc;

        if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s|l", &input, &input_len, &mode) == FAILURE) {
                return;
        }

        doc = tidyCreate();
        tidyBufInit(&errbuf);

        tidyOptSetBool(doc, TidyForceOutput, yes);
        tidyOptSetBool(doc, TidyMark, no);

        if (tidySetErrorBuffer(doc, &errbuf) != 0) {
                tidyRelease(doc);
                tidyBufFree(&errbuf);

                php_error_docref(NULL TSRMLS_CC, E_ERROR, "Could not set Tidy error buffer");
        }

        TIDY_SET_DEFAULT_CONFIG(doc);

        if (input_len > 1) {
                TidyBuffer buf;
                
                tidyBufInit(&buf);
                tidyBufAppend(&buf, input, input_len);
                
                if (tidyParseBuffer(doc, &buf) < 0 || tidyCleanAndRepair(doc) < 0) {
                        php_error_docref(NULL TSRMLS_CC, E_WARNING, "%s", errbuf.bp);
                        RETVAL_NULL();
                } else {
                        TidyBuffer output;
                        tidyBufInit(&output);

                        tidySaveBuffer(doc, &output);
                        RETVAL_STRINGL((char*)output.bp, output.size ? output.size-1 : 0, 1);

                        tidyBufFree(&output);
                }
                
                tidyBufFree(&buf);
        } else {
                RETVAL_NULL();
        }

        tidyRelease(doc);
        tidyBufFree(&errbuf);
}

/* {{{ proto bool tidy_parse_string(string input [, mixed config_options [, string encoding]])
   Parse a document stored in a string */
static PHP_FUNCTION(tidy_parse_string)
{
        char *input, *enc = NULL;
        int input_len, enc_len = 0;
        zval **options = NULL;
        
        PHPTidyObj *obj;

        if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s|Zs", &input, &input_len, &options, &enc, &enc_len) == FAILURE) {
                RETURN_FALSE;
        }

        tidy_instanciate(tidy_ce_doc, return_value TSRMLS_CC);
        obj = (PHPTidyObj *) zend_object_store_get_object(return_value TSRMLS_CC);
                
        TIDY_APPLY_CONFIG_ZVAL(obj->ptdoc->doc, options);
        
        if(php_tidy_parse_string(obj, input, input_len, enc TSRMLS_CC) == FAILURE) {
                zval_dtor(return_value);
                INIT_ZVAL(*return_value);
                RETURN_FALSE;
        }
        
}
/* }}} */

/* {{{ proto string tidy_get_error_buffer([boolean detailed])
   Return warnings and errors which occured parsing the specified document*/
static PHP_FUNCTION(tidy_get_error_buffer)
{
        TIDY_FETCH_OBJECT;

        if (obj->ptdoc->errbuf && obj->ptdoc->errbuf->bp) {
                RETURN_STRINGL((char*)obj->ptdoc->errbuf->bp, obj->ptdoc->errbuf->size-1, 1);
        } else {
                RETURN_FALSE;
        }
}
/* }}} */

/* {{{ proto string tidy_get_output()
   Return a string representing the parsed tidy markup */
static PHP_FUNCTION(tidy_get_output)
{
        TidyBuffer output;
        TIDY_FETCH_OBJECT;

        tidyBufInit(&output);
        tidySaveBuffer(obj->ptdoc->doc, &output);

        RETVAL_STRINGL((char*)output.bp, output.size ? output.size-1 : 0, 1);

        tidyBufFree(&output);
}
/* }}} */

/* {{{ proto boolean tidy_parse_file(string file [, mixed config_options [, string encoding [, bool use_include_path]]])
   Parse markup in file or URI */
static PHP_FUNCTION(tidy_parse_file)
{
        char *inputfile, *enc = NULL;
        int input_len, contents_len, enc_len = 0;
        zend_bool use_include_path = 0;
        char *contents;
        zval **options = NULL;
        
        PHPTidyObj *obj;

        if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s|Zsb", &inputfile, &input_len,
                                                          &options, &enc, &enc_len, &use_include_path) == FAILURE) {
                RETURN_FALSE;
        }

        tidy_instanciate(tidy_ce_doc, return_value TSRMLS_CC);
        obj = (PHPTidyObj *) zend_object_store_get_object(return_value TSRMLS_CC);

        if (!(contents = php_tidy_file_to_mem(inputfile, use_include_path, &contents_len TSRMLS_CC))) {
                php_error_docref(NULL TSRMLS_CC, E_WARNING, "Cannot Load '%s' into memory %s", inputfile, (use_include_path) ? "(Using include path)" : "");
                RETURN_FALSE;
        }

        TIDY_APPLY_CONFIG_ZVAL(obj->ptdoc->doc, options);

        if(php_tidy_parse_string(obj, contents, contents_len, enc TSRMLS_CC) == FAILURE) {
                zval_dtor(return_value);
                INIT_ZVAL(*return_value);
                RETVAL_FALSE;
        }

        efree(contents);
}
/* }}} */

/* {{{ proto boolean tidy_clean_repair()
   Execute configured cleanup and repair operations on parsed markup */
static PHP_FUNCTION(tidy_clean_repair)
{
        TIDY_FETCH_OBJECT;

        if (tidyCleanAndRepair(obj->ptdoc->doc) >= 0) {
                tidy_doc_update_properties(obj TSRMLS_CC);
                RETURN_TRUE;
        }

        RETURN_FALSE;
}
/* }}} */

/* {{{ proto boolean tidy_repair_string(string data [, mixed config_file [, string encoding]])
   Repair a string using an optionally provided configuration file */
static PHP_FUNCTION(tidy_repair_string)
{
        php_tidy_quick_repair(INTERNAL_FUNCTION_PARAM_PASSTHRU, FALSE);
}
/* }}} */

/* {{{ proto boolean tidy_repair_file(string filename [, mixed config_file [, string encoding [, bool use_include_path]]])
   Repair a file using an optionally provided configuration file */
static PHP_FUNCTION(tidy_repair_file)
{
        php_tidy_quick_repair(INTERNAL_FUNCTION_PARAM_PASSTHRU, TRUE);
}
/* }}} */

/* {{{ proto boolean tidy_diagnose()
   Run configured diagnostics on parsed and repaired markup. */
static PHP_FUNCTION(tidy_diagnose)
{
        TIDY_FETCH_OBJECT;

        if (tidyRunDiagnostics(obj->ptdoc->doc) >= 0) {
                tidy_doc_update_properties(obj TSRMLS_CC);
                RETURN_TRUE;
        }

        RETURN_FALSE;
}
/* }}} */

/* {{{ proto string tidy_get_release()
   Get release date (version) for Tidy library */
static PHP_FUNCTION(tidy_get_release)
{
        if (ZEND_NUM_ARGS()) {
                WRONG_PARAM_COUNT;
        }

        RETURN_STRING((char *)tidyReleaseDate(), 1);
}
/* }}} */


#if HAVE_TIDYOPTGETDOC
/* {{{ proto string tidy_get_opt_doc(tidy resource, string optname)
   Returns the documentation for the given option name */
static PHP_FUNCTION(tidy_get_opt_doc)
{
        PHPTidyObj *obj;
        char *optname, *optval;
        int optname_len;
        TidyOption opt;

        TIDY_SET_CONTEXT;

        if (object) {
                if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s", &optname, &optname_len) == FAILURE) {
                        RETURN_FALSE;
                }
        } else {
                if (zend_parse_method_parameters(ZEND_NUM_ARGS() TSRMLS_CC, NULL, "Os", &object, tidy_ce_doc, &optname, &optname_len) == FAILURE) {
                        RETURN_FALSE;
                }
        }

        obj = (PHPTidyObj *) zend_object_store_get_object(object TSRMLS_CC);

        opt = tidyGetOptionByName(obj->ptdoc->doc, optname);

        if (!opt) {
                php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unknown Tidy Configuration Option '%s'", optname);
                RETURN_FALSE;
        }

        if ( (optval = (char *) tidyOptGetDoc(obj->ptdoc->doc, opt)) ) {
                RETURN_STRING(optval, 1);
        }

        RETURN_FALSE;
}
/* }}} */
#endif


/* {{{ proto array tidy_get_config()
   Get current Tidy configuarion */
static PHP_FUNCTION(tidy_get_config)
{
        TidyIterator itOpt;
        char *opt_name;
        void *opt_value;
        TidyOptionType optt;

        TIDY_FETCH_OBJECT;

        itOpt = tidyGetOptionList(obj->ptdoc->doc);

        array_init(return_value);

        while (itOpt) {
                TidyOption opt = tidyGetNextOption(obj->ptdoc->doc, &itOpt);

                opt_name = (char *)tidyOptGetName(opt);
                opt_value = php_tidy_get_opt_val(obj->ptdoc, opt, &optt TSRMLS_CC);
                switch (optt) {
                        case TidyString:
                                add_assoc_string(return_value, opt_name, (char*)opt_value, 0);
                                break;

                        case TidyInteger:
                                add_assoc_long(return_value, opt_name, (long)opt_value);
                                break;

                        case TidyBoolean:
                                add_assoc_bool(return_value, opt_name, (long)opt_value);
                                break;
                }
        }

        return;
}
/* }}} */

/* {{{ proto int tidy_get_status()
   Get status of specfied document. */
static PHP_FUNCTION(tidy_get_status)
{
        TIDY_FETCH_OBJECT;

        RETURN_LONG(tidyStatus(obj->ptdoc->doc));
}
/* }}} */

/* {{{ proto int tidy_get_html_ver()
   Get the Detected HTML version for the specified document. */
static PHP_FUNCTION(tidy_get_html_ver)
{
        TIDY_FETCH_OBJECT;

        RETURN_LONG(tidyDetectedHtmlVersion(obj->ptdoc->doc));
}
/* }}} */

/* {{{ proto boolean tidy_is_xhtml()
   Indicates if the document is a XHTML document. */
static PHP_FUNCTION(tidy_is_xhtml)
{
        TIDY_FETCH_OBJECT;

        RETURN_BOOL(tidyDetectedXhtml(obj->ptdoc->doc));
}
/* }}} */

/* {{{ proto boolean tidy_is_xml()
   Indicates if the document is a generic (non HTML/XHTML) XML document. */
static PHP_FUNCTION(tidy_is_xml)
{
        TIDY_FETCH_OBJECT;

        RETURN_BOOL(tidyDetectedGenericXml(obj->ptdoc->doc));
}
/* }}} */

/* {{{ proto int tidy_error_count()
   Returns the Number of Tidy errors encountered for specified document. */
static PHP_FUNCTION(tidy_error_count)
{
        TIDY_FETCH_OBJECT;

        RETURN_LONG(tidyErrorCount(obj->ptdoc->doc));
}
/* }}} */

/* {{{ proto int tidy_warning_count()
   Returns the Number of Tidy warnings encountered for specified document. */
static PHP_FUNCTION(tidy_warning_count)
{
        TIDY_FETCH_OBJECT;

        RETURN_LONG(tidyWarningCount(obj->ptdoc->doc));
}
/* }}} */

/* {{{ proto int tidy_access_count()
   Returns the Number of Tidy accessibility warnings encountered for specified document. */
static PHP_FUNCTION(tidy_access_count)
{
        TIDY_FETCH_OBJECT;

        RETURN_LONG(tidyAccessWarningCount(obj->ptdoc->doc));
}
/* }}} */

/* {{{ proto int tidy_config_count()
   Returns the Number of Tidy configuration errors encountered for specified document. */
static PHP_FUNCTION(tidy_config_count)
{
        TIDY_FETCH_OBJECT;

        RETURN_LONG(tidyConfigErrorCount(obj->ptdoc->doc));
}
/* }}} */

/* {{{ proto mixed tidy_getopt(string option)
   Returns the value of the specified configuration option for the tidy document. */
static PHP_FUNCTION(tidy_getopt)
{  
        PHPTidyObj *obj;
        char *optname;
        void *optval;
        int optname_len;
        TidyOption opt;
        TidyOptionType optt;
        
        TIDY_SET_CONTEXT;

        if (object) {
                if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s", &optname, &optname_len) == FAILURE) {
                        RETURN_FALSE;
                }
        } else {
                if (zend_parse_method_parameters(ZEND_NUM_ARGS() TSRMLS_CC, NULL, "Os", &object, tidy_ce_doc, &optname, &optname_len) == FAILURE) {
                        RETURN_FALSE;
                }
        }

        obj = (PHPTidyObj *) zend_object_store_get_object(object TSRMLS_CC);

        opt = tidyGetOptionByName(obj->ptdoc->doc, optname);

        if (!opt) {
                php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unknown Tidy Configuration Option '%s'", optname);
                RETURN_FALSE;
        }

        optval = php_tidy_get_opt_val(obj->ptdoc, opt, &optt TSRMLS_CC);
        switch (optt) {
                case TidyString:
                        RETURN_STRING((char *)optval, 0);
                        break;

                case TidyInteger:
                        RETURN_LONG((long)optval);
                        break;

                case TidyBoolean:
                        if (optval) {
                                RETURN_TRUE;
                        } else {
                                RETURN_FALSE;
                        }
                        break;

                default:
                        php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unable to determine type of configuration option");
                        break;
        }

        RETURN_FALSE;
}
/* }}} */

static TIDY_DOC_METHOD(__construct)
{
        char *inputfile = NULL, *enc = NULL;
        int input_len = 0, enc_len = 0, contents_len = 0;
        zend_bool use_include_path = 0;
        char *contents;
        zval **options = NULL;
        
        PHPTidyObj *obj;
        TIDY_SET_CONTEXT;       
        
        if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "|sZsb", &inputfile, &input_len,
                                                          &options, &enc, &enc_len, &use_include_path) == FAILURE) {
                RETURN_FALSE;
        }
        
        obj = (PHPTidyObj *)zend_object_store_get_object(object TSRMLS_CC);
        
        if (inputfile) {
                if (!(contents = php_tidy_file_to_mem(inputfile, use_include_path, &contents_len TSRMLS_CC))) {
                        php_error_docref(NULL TSRMLS_CC, E_WARNING, "Cannot Load '%s' into memory %s", inputfile, (use_include_path) ? "(Using include path)" : "");
                        return;
                }

                TIDY_APPLY_CONFIG_ZVAL(obj->ptdoc->doc, options);

                php_tidy_parse_string(obj, contents, contents_len, enc TSRMLS_CC);

                efree(contents);
        }
}

static TIDY_DOC_METHOD(parseFile)
{
        char *inputfile, *enc = NULL;
        int input_len, enc_len = 0, contents_len = 0;
        zend_bool use_include_path = 0;
        char *contents;
        zval **options = NULL;
        PHPTidyObj *obj;

        TIDY_SET_CONTEXT;

        obj = (PHPTidyObj *)zend_object_store_get_object(object TSRMLS_CC);

        if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s|Zsb", &inputfile, &input_len,
                                                          &options, &enc, &enc_len, &use_include_path) == FAILURE) {
                RETURN_FALSE;
        }
        
        if (!(contents = php_tidy_file_to_mem(inputfile, use_include_path, &contents_len TSRMLS_CC))) {
                php_error_docref(NULL TSRMLS_CC, E_WARNING, "Cannot Load '%s' into memory %s", inputfile, (use_include_path) ? "(Using include path)" : "");
                RETURN_FALSE;
        }

        TIDY_APPLY_CONFIG_ZVAL(obj->ptdoc->doc, options);

        if(php_tidy_parse_string(obj, contents, contents_len, enc TSRMLS_CC) == FAILURE) {
                RETVAL_FALSE;
        } else {
                RETVAL_TRUE;
        }

        efree(contents);
}

static TIDY_DOC_METHOD(parseString)
{
        char *input, *enc = NULL;
        int input_len, enc_len = 0;
        zval **options = NULL;
        PHPTidyObj *obj;

        TIDY_SET_CONTEXT;

        if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s|Zs", &input, &input_len, &options, &enc, &enc_len) == FAILURE) {
                RETURN_FALSE;
        }

        obj = (PHPTidyObj *)zend_object_store_get_object(object TSRMLS_CC);

        TIDY_APPLY_CONFIG_ZVAL(obj->ptdoc->doc, options);

        if(php_tidy_parse_string(obj, input, input_len, enc TSRMLS_CC) == SUCCESS) {
                RETURN_TRUE;
        }
        
        RETURN_FALSE;
}


/* {{{ proto TidyNode tidy_get_root()
   Returns a TidyNode Object representing the root of the tidy parse tree */
static PHP_FUNCTION(tidy_get_root)
{
        php_tidy_create_node(INTERNAL_FUNCTION_PARAM_PASSTHRU, is_root_node);
}
/* }}} */

/* {{{ proto TidyNode tidy_get_html()
   Returns a TidyNode Object starting from the <HTML> tag of the tidy parse tree */
static PHP_FUNCTION(tidy_get_html)
{
        php_tidy_create_node(INTERNAL_FUNCTION_PARAM_PASSTHRU, is_html_node);
}
/* }}} */

/* {{{ proto TidyNode tidy_get_head()
   Returns a TidyNode Object starting from the <HEAD> tag of the tidy parse tree */
static PHP_FUNCTION(tidy_get_head)
{
        php_tidy_create_node(INTERNAL_FUNCTION_PARAM_PASSTHRU, is_head_node);
}
/* }}} */

/* {{{ proto TidyNode tidy_get_body(resource tidy)
   Returns a TidyNode Object starting from the <BODY> tag of the tidy parse tree */
static PHP_FUNCTION(tidy_get_body)
{
        php_tidy_create_node(INTERNAL_FUNCTION_PARAM_PASSTHRU, is_body_node);
}
/* }}} */

/* {{{ proto boolean tidyNode::hasChildren()
   Returns true if this node has children */
static TIDY_NODE_METHOD(hasChildren)
{
        TIDY_FETCH_ONLY_OBJECT;

        if (tidyGetChild(obj->node)) {
                RETURN_TRUE;
        } else {
                RETURN_FALSE;
        }
}
/* }}} */

/* {{{ proto boolean tidyNode::hasSiblings()
   Returns true if this node has siblings */
static TIDY_NODE_METHOD(hasSiblings)
{
        TIDY_FETCH_ONLY_OBJECT;

        if (obj->node && tidyGetNext(obj->node)) {
                RETURN_TRUE;
        } else {
                RETURN_FALSE;
        }
}
/* }}} */

/* {{{ proto boolean tidyNode::isComment()
   Returns true if this node represents a comment */
static TIDY_NODE_METHOD(isComment)
{
        TIDY_FETCH_ONLY_OBJECT;

        if (tidyNodeGetType(obj->node) == TidyNode_Comment) {
                RETURN_TRUE;
        } else {
                RETURN_FALSE;
        }
}
/* }}} */

/* {{{ proto boolean tidyNode::isHtml()
   Returns true if this node is part of a HTML document */
static TIDY_NODE_METHOD(isHtml)
{
        TIDY_FETCH_ONLY_OBJECT;

        if (tidyNodeGetType(obj->node) & (TidyNode_Start | TidyNode_End | TidyNode_StartEnd)) {
                RETURN_TRUE;
        }

        RETURN_FALSE;
}
/* }}} */

/* {{{ proto boolean tidyNode::isText()
   Returns true if this node represents text (no markup) */
static TIDY_NODE_METHOD(isText)
{
        TIDY_FETCH_ONLY_OBJECT;

        if (tidyNodeGetType(obj->node) == TidyNode_Text) {
                RETURN_TRUE;
        } else {
                RETURN_FALSE;
        }
}
/* }}} */

/* {{{ proto boolean tidyNode::isJste()
   Returns true if this node is JSTE */
static TIDY_NODE_METHOD(isJste)
{
        TIDY_FETCH_ONLY_OBJECT;

        if (tidyNodeGetType(obj->node) == TidyNode_Jste) {
                RETURN_TRUE;
        } else {
                RETURN_FALSE;
        }
}
/* }}} */

/* {{{ proto boolean tidyNode::isAsp()
   Returns true if this node is ASP */
static TIDY_NODE_METHOD(isAsp)
{
        TIDY_FETCH_ONLY_OBJECT;

        if (tidyNodeGetType(obj->node) == TidyNode_Asp) {
                RETURN_TRUE;
        } else {
                RETURN_FALSE;
        }
}
/* }}} */

/* {{{ proto boolean tidyNode::isPhp()
   Returns true if this node is PHP */
static TIDY_NODE_METHOD(isPhp)
{
        TIDY_FETCH_ONLY_OBJECT;

        if (tidyNodeGetType(obj->node) == TidyNode_Php) {
                RETURN_TRUE;
        } else {
                RETURN_FALSE;
        }
}
/* }}} */

/* {{{ proto tidyNode tidyNode::getParent()
   Returns the parent node if available or NULL */
static TIDY_NODE_METHOD(getParent)
{
        TidyNode        parent_node;
        PHPTidyObj *newobj;
        TIDY_FETCH_ONLY_OBJECT;

        parent_node = tidyGetParent(obj->node);
        if(parent_node) {
                tidy_instanciate(tidy_ce_node, return_value TSRMLS_CC);
                newobj = (PHPTidyObj *) zend_object_store_get_object(return_value TSRMLS_CC);
                newobj->node = parent_node;
                newobj->type = is_node;
                newobj->ptdoc = obj->ptdoc;
                newobj->ptdoc->ref_count++;
                tidy_add_default_properties(newobj, is_node TSRMLS_CC);
        } else {
                ZVAL_NULL(return_value);
        }
}
/* }}} */

static void _php_tidy_register_nodetypes(INIT_FUNC_ARGS)
{
        TIDY_NODE_CONST(ROOT, Root);
        TIDY_NODE_CONST(DOCTYPE, DocType);
        TIDY_NODE_CONST(COMMENT, Comment);
        TIDY_NODE_CONST(PROCINS, ProcIns);
        TIDY_NODE_CONST(TEXT, Text);
        TIDY_NODE_CONST(START, Start);
        TIDY_NODE_CONST(END, End);
        TIDY_NODE_CONST(STARTEND, StartEnd);
        TIDY_NODE_CONST(CDATA, CDATA);
        TIDY_NODE_CONST(SECTION, Section);
        TIDY_NODE_CONST(ASP, Asp);
        TIDY_NODE_CONST(JSTE, Jste);
        TIDY_NODE_CONST(PHP, Php);
        TIDY_NODE_CONST(XMLDECL, XmlDecl);
}

static void _php_tidy_register_tags(INIT_FUNC_ARGS)
{
        TIDY_TAG_CONST(UNKNOWN);
        TIDY_TAG_CONST(A);
        TIDY_TAG_CONST(ABBR);
        TIDY_TAG_CONST(ACRONYM);
        TIDY_TAG_CONST(ADDRESS);
        TIDY_TAG_CONST(ALIGN);
        TIDY_TAG_CONST(APPLET);
        TIDY_TAG_CONST(AREA);
        TIDY_TAG_CONST(B);
        TIDY_TAG_CONST(BASE);
        TIDY_TAG_CONST(BASEFONT);
        TIDY_TAG_CONST(BDO);
        TIDY_TAG_CONST(BGSOUND);
        TIDY_TAG_CONST(BIG);
        TIDY_TAG_CONST(BLINK);
        TIDY_TAG_CONST(BLOCKQUOTE);
        TIDY_TAG_CONST(BODY);
        TIDY_TAG_CONST(BR);
        TIDY_TAG_CONST(BUTTON);
        TIDY_TAG_CONST(CAPTION);
        TIDY_TAG_CONST(CENTER);
        TIDY_TAG_CONST(CITE);
        TIDY_TAG_CONST(CODE);
        TIDY_TAG_CONST(COL);
        TIDY_TAG_CONST(COLGROUP);
        TIDY_TAG_CONST(COMMENT);
        TIDY_TAG_CONST(DD);
        TIDY_TAG_CONST(DEL);
        TIDY_TAG_CONST(DFN);
        TIDY_TAG_CONST(DIR);
        TIDY_TAG_CONST(DIV);
        TIDY_TAG_CONST(DL);
        TIDY_TAG_CONST(DT);
        TIDY_TAG_CONST(EM);
        TIDY_TAG_CONST(EMBED);
        TIDY_TAG_CONST(FIELDSET);
        TIDY_TAG_CONST(FONT);
        TIDY_TAG_CONST(FORM);
        TIDY_TAG_CONST(FRAME);
        TIDY_TAG_CONST(FRAMESET);
        TIDY_TAG_CONST(H1);
        TIDY_TAG_CONST(H2);
        TIDY_TAG_CONST(H3);
        TIDY_TAG_CONST(H4);
        TIDY_TAG_CONST(H5);
        TIDY_TAG_CONST(H6);
        TIDY_TAG_CONST(HEAD);
        TIDY_TAG_CONST(HR);
        TIDY_TAG_CONST(HTML);
        TIDY_TAG_CONST(I);
        TIDY_TAG_CONST(IFRAME);
        TIDY_TAG_CONST(ILAYER);
        TIDY_TAG_CONST(IMG);
        TIDY_TAG_CONST(INPUT);
        TIDY_TAG_CONST(INS);
        TIDY_TAG_CONST(ISINDEX);
        TIDY_TAG_CONST(KBD);
        TIDY_TAG_CONST(KEYGEN);
        TIDY_TAG_CONST(LABEL);
        TIDY_TAG_CONST(LAYER);
        TIDY_TAG_CONST(LEGEND);
        TIDY_TAG_CONST(LI);
        TIDY_TAG_CONST(LINK);
        TIDY_TAG_CONST(LISTING);
        TIDY_TAG_CONST(MAP);
        TIDY_TAG_CONST(MARQUEE);
        TIDY_TAG_CONST(MENU);
        TIDY_TAG_CONST(META);
        TIDY_TAG_CONST(MULTICOL);
        TIDY_TAG_CONST(NOBR);
        TIDY_TAG_CONST(NOEMBED);
        TIDY_TAG_CONST(NOFRAMES);
        TIDY_TAG_CONST(NOLAYER);
        TIDY_TAG_CONST(NOSAVE);
        TIDY_TAG_CONST(NOSCRIPT);
        TIDY_TAG_CONST(OBJECT);
        TIDY_TAG_CONST(OL);
        TIDY_TAG_CONST(OPTGROUP);
        TIDY_TAG_CONST(OPTION);
        TIDY_TAG_CONST(P);
        TIDY_TAG_CONST(PARAM);
        TIDY_TAG_CONST(PLAINTEXT);
        TIDY_TAG_CONST(PRE);
        TIDY_TAG_CONST(Q);
        TIDY_TAG_CONST(RB);
        TIDY_TAG_CONST(RBC);
        TIDY_TAG_CONST(RP);
        TIDY_TAG_CONST(RT);
        TIDY_TAG_CONST(RTC);
        TIDY_TAG_CONST(RUBY);
        TIDY_TAG_CONST(S);
        TIDY_TAG_CONST(SAMP);
        TIDY_TAG_CONST(SCRIPT);
        TIDY_TAG_CONST(SELECT);
        TIDY_TAG_CONST(SERVER);
        TIDY_TAG_CONST(SERVLET);
        TIDY_TAG_CONST(SMALL);
        TIDY_TAG_CONST(SPACER);
        TIDY_TAG_CONST(SPAN);
        TIDY_TAG_CONST(STRIKE);
        TIDY_TAG_CONST(STRONG);
        TIDY_TAG_CONST(STYLE);
        TIDY_TAG_CONST(SUB);
        TIDY_TAG_CONST(SUP);
        TIDY_TAG_CONST(TABLE);
        TIDY_TAG_CONST(TBODY);
        TIDY_TAG_CONST(TD);
        TIDY_TAG_CONST(TEXTAREA);
        TIDY_TAG_CONST(TFOOT);
        TIDY_TAG_CONST(TH);
        TIDY_TAG_CONST(THEAD);
        TIDY_TAG_CONST(TITLE);
        TIDY_TAG_CONST(TR);
        TIDY_TAG_CONST(TT);
        TIDY_TAG_CONST(U);
        TIDY_TAG_CONST(UL);
        TIDY_TAG_CONST(VAR);
        TIDY_TAG_CONST(WBR);
        TIDY_TAG_CONST(XMP);
}

#endif

/*
 * Local variables:
 * tab-width: 4
 * c-basic-offset: 4
 * End:
 * vim600: noet sw=4 ts=4 fdm=marker
 * vim<600: noet sw=4 ts=4
 */

/* [<][>][^][v][top][bottom][index][help] */