2010-03-28 22:10:10 +00:00
|
|
|
<?xml version="1.0" encoding="utf-8"?>
|
2009-07-11 09:08:43 +00:00
|
|
|
<!-- $Revision$ -->
|
2007-06-20 22:25:43 +00:00
|
|
|
<refentry xmlns="http://docbook.org/ns/docbook" xml:id="function.html-entity-decode">
|
2007-06-15 19:01:26 +00:00
|
|
|
<refnamediv>
|
|
|
|
<refname>html_entity_decode</refname>
|
|
|
|
<refpurpose>Convert all HTML entities to their applicable characters</refpurpose>
|
|
|
|
</refnamediv>
|
2007-06-15 19:01:57 +00:00
|
|
|
|
|
|
|
<refsect1 role="description">
|
|
|
|
&reftitle.description;
|
2007-06-15 19:01:26 +00:00
|
|
|
<methodsynopsis>
|
|
|
|
<type>string</type><methodname>html_entity_decode</methodname>
|
|
|
|
<methodparam><type>string</type><parameter>string</parameter></methodparam>
|
2009-01-16 16:14:26 +00:00
|
|
|
<methodparam choice="opt"><type>int</type><parameter>quote_style</parameter><initializer>ENT_COMPAT</initializer></methodparam>
|
2007-06-15 19:01:26 +00:00
|
|
|
<methodparam choice="opt"><type>string</type><parameter>charset</parameter></methodparam>
|
|
|
|
</methodsynopsis>
|
|
|
|
<para>
|
|
|
|
<function>html_entity_decode</function> is the opposite of
|
|
|
|
<function>htmlentities</function> in that it converts all HTML entities
|
|
|
|
to their applicable characters from <parameter>string</parameter>.
|
|
|
|
</para>
|
2007-06-15 19:01:57 +00:00
|
|
|
</refsect1>
|
|
|
|
|
|
|
|
<refsect1 role="parameters">
|
|
|
|
&reftitle.parameters;
|
2007-06-15 19:01:26 +00:00
|
|
|
<para>
|
2007-06-15 19:01:57 +00:00
|
|
|
<variablelist>
|
|
|
|
<varlistentry>
|
|
|
|
<term><parameter>string</parameter></term>
|
|
|
|
<listitem>
|
|
|
|
<para>
|
|
|
|
The input string.
|
|
|
|
</para>
|
|
|
|
</listitem>
|
|
|
|
</varlistentry>
|
|
|
|
<varlistentry>
|
|
|
|
<term><parameter>quote_style</parameter></term>
|
|
|
|
<listitem>
|
|
|
|
<para>
|
|
|
|
The optional second <parameter>quote_style</parameter> parameter lets
|
|
|
|
you define what will be done with 'single' and "double" quotes. It takes
|
|
|
|
one of three constants, with the default being
|
|
|
|
<constant>ENT_COMPAT</constant>:
|
|
|
|
<table>
|
|
|
|
<title>Available <parameter>quote_style</parameter> constants</title>
|
|
|
|
<tgroup cols="2">
|
|
|
|
<thead>
|
|
|
|
<row>
|
|
|
|
<entry>Constant Name</entry>
|
|
|
|
<entry>Description</entry>
|
|
|
|
</row>
|
|
|
|
</thead>
|
|
|
|
<tbody>
|
|
|
|
<row>
|
|
|
|
<entry><constant>ENT_COMPAT</constant></entry>
|
|
|
|
<entry>Will convert double-quotes and leave single-quotes alone.</entry>
|
|
|
|
</row>
|
|
|
|
<row>
|
|
|
|
<entry><constant>ENT_QUOTES</constant></entry>
|
|
|
|
<entry>Will convert both double and single quotes.</entry>
|
|
|
|
</row>
|
|
|
|
<row>
|
|
|
|
<entry><constant>ENT_NOQUOTES</constant></entry>
|
|
|
|
<entry>Will leave both double and single quotes unconverted.</entry>
|
|
|
|
</row>
|
|
|
|
</tbody>
|
|
|
|
</tgroup>
|
|
|
|
</table>
|
|
|
|
</para>
|
|
|
|
</listitem>
|
|
|
|
</varlistentry>
|
|
|
|
<varlistentry>
|
|
|
|
<term><parameter>charset</parameter></term>
|
|
|
|
<listitem>
|
|
|
|
<para>
|
|
|
|
The ISO-8859-1 character set is used as default for the optional third
|
|
|
|
<parameter>charset</parameter> parameter. This defines the character set used in
|
|
|
|
conversion.
|
|
|
|
</para>
|
|
|
|
&reference.strings.charsets;
|
|
|
|
</listitem>
|
|
|
|
</varlistentry>
|
|
|
|
</variablelist>
|
|
|
|
</para>
|
|
|
|
</refsect1>
|
|
|
|
|
|
|
|
<refsect1 role="returnvalues">
|
|
|
|
&reftitle.returnvalues;
|
|
|
|
<para>
|
|
|
|
Returns the decoded string.
|
|
|
|
</para>
|
|
|
|
</refsect1>
|
|
|
|
|
|
|
|
<refsect1 role="changelog">
|
|
|
|
&reftitle.changelog;
|
|
|
|
<para>
|
|
|
|
<informaltable>
|
2007-06-15 19:01:26 +00:00
|
|
|
<tgroup cols="2">
|
|
|
|
<thead>
|
|
|
|
<row>
|
2007-06-15 19:01:57 +00:00
|
|
|
<entry>&Version;</entry>
|
|
|
|
<entry>&Description;</entry>
|
2007-06-15 19:01:26 +00:00
|
|
|
</row>
|
|
|
|
</thead>
|
|
|
|
<tbody>
|
|
|
|
<row>
|
2007-06-15 19:01:57 +00:00
|
|
|
<entry>5.0.0</entry>
|
|
|
|
<entry>
|
2007-10-17 10:18:30 +00:00
|
|
|
Support for multi-byte character sets was added.
|
2007-06-15 19:01:57 +00:00
|
|
|
</entry>
|
2007-06-15 19:01:26 +00:00
|
|
|
</row>
|
|
|
|
</tbody>
|
|
|
|
</tgroup>
|
2007-06-15 19:01:57 +00:00
|
|
|
</informaltable>
|
2007-06-15 19:01:26 +00:00
|
|
|
</para>
|
2007-06-15 19:01:57 +00:00
|
|
|
</refsect1>
|
|
|
|
|
|
|
|
<refsect1 role="examples">
|
|
|
|
&reftitle.examples;
|
2007-06-15 19:01:26 +00:00
|
|
|
<para>
|
|
|
|
<example>
|
|
|
|
<title>Decoding HTML entities</title>
|
|
|
|
<programlisting role="php">
|
2002-11-18 09:28:42 +00:00
|
|
|
<![CDATA[
|
|
|
|
<?php
|
|
|
|
$orig = "I'll \"walk\" the <b>dog</b> now";
|
|
|
|
|
|
|
|
$a = htmlentities($orig);
|
|
|
|
|
|
|
|
$b = html_entity_decode($a);
|
|
|
|
|
|
|
|
echo $a; // I'll &quot;walk&quot; the &lt;b&gt;dog&lt;/b&gt; now
|
|
|
|
|
|
|
|
echo $b; // I'll "walk" the <b>dog</b> now
|
|
|
|
|
|
|
|
|
|
|
|
// For users prior to PHP 4.3.0 you may do this:
|
2007-06-15 19:01:26 +00:00
|
|
|
/**
 * Fallback decoder: converts numeric and named HTML entities in a string
 * back to their characters.
 *
 * Numeric entities are turned into a single byte with chr(), so only code
 * points that fit the single-byte charset in use are decoded meaningfully.
 * Callbacks are passed by name (not as closures) so the example also runs
 * on old PHP versions; the "e" pattern modifier is avoided because it was
 * deprecated in PHP 5.5.0 and removed in PHP 7.0.0.
 *
 * @param string $string The string containing HTML entities.
 * @return string The decoded string.
 */
function unhtmlentities($string)
{
    // replace numeric entities (hexadecimal first, then decimal)
    $string = preg_replace_callback('~&#x([0-9a-f]+);~i', 'unhtmlentities_hex_cb', $string);
    $string = preg_replace_callback('~&#([0-9]+);~', 'unhtmlentities_dec_cb', $string);
    // replace literal entities: flip the char => entity table into entity => char
    $trans_tbl = get_html_translation_table(HTML_ENTITIES);
    $trans_tbl = array_flip($trans_tbl);
    return strtr($string, $trans_tbl);
}

// Callback for unhtmlentities(): decodes one hexadecimal entity match (&#xHH;).
function unhtmlentities_hex_cb($matches)
{
    return chr(hexdec($matches[1]));
}

// Callback for unhtmlentities(): decodes one decimal entity match (&#DDD;).
function unhtmlentities_dec_cb($matches)
{
    return chr((int) $matches[1]);
}
|
|
|
|
|
|
|
|
$c = unhtmlentities($a);
|
|
|
|
|
|
|
|
echo $c; // I'll "walk" the <b>dog</b> now
|
|
|
|
|
|
|
|
?>
|
|
|
|
]]>
|
2007-06-15 19:01:26 +00:00
|
|
|
</programlisting>
|
2007-06-15 19:01:57 +00:00
|
|
|
</example>
|
2007-06-15 19:01:26 +00:00
|
|
|
</para>
|
2007-06-15 19:01:57 +00:00
|
|
|
</refsect1>
|
|
|
|
|
|
|
|
<refsect1 role="notes">
|
|
|
|
&reftitle.notes;
|
|
|
|
<note>
|
|
|
|
<para>
|
|
|
|
You might wonder why trim(html_entity_decode('&amp;nbsp;')); doesn't
|
|
|
|
reduce the string to an empty string. That's because the '&amp;nbsp;'
|
|
|
|
entity is not ASCII code 32 (which is stripped by
|
|
|
|
<function>trim</function>) but character code 160 (0xa0) in the default ISO
|
|
|
|
8859-1 character set.
|
|
|
|
</para>
|
|
|
|
</note>
|
|
|
|
</refsect1>
|
|
|
|
|
|
|
|
<refsect1 role="seealso">
|
|
|
|
&reftitle.seealso;
|
2007-06-15 19:01:26 +00:00
|
|
|
<para>
|
2007-06-15 19:01:57 +00:00
|
|
|
<simplelist>
|
|
|
|
<member><function>htmlentities</function></member>
|
|
|
|
<member><function>htmlspecialchars</function></member>
|
|
|
|
<member><function>get_html_translation_table</function></member>
|
|
|
|
<member><function>urldecode</function></member>
|
|
|
|
</simplelist>
|
2007-06-15 19:01:26 +00:00
|
|
|
</para>
|
|
|
|
</refsect1>
|
2007-06-15 19:01:57 +00:00
|
|
|
|
2007-06-15 19:01:26 +00:00
|
|
|
</refentry>
|
2002-11-18 09:28:42 +00:00
|
|
|
|
|
|
|
<!-- Keep this comment at the end of the file
|
|
|
|
Local variables:
|
|
|
|
mode: sgml
|
|
|
|
sgml-omittag:t
|
|
|
|
sgml-shorttag:t
|
|
|
|
sgml-minimize-attributes:nil
|
|
|
|
sgml-always-quote-attributes:t
|
|
|
|
sgml-indent-step:1
|
|
|
|
sgml-indent-data:t
|
|
|
|
indent-tabs-mode:nil
|
|
|
|
sgml-parent-document:nil
|
2009-09-25 07:04:39 +00:00
|
|
|
sgml-default-dtd-file:"~/.phpdoc/manual.ced"
|
2002-11-18 09:28:42 +00:00
|
|
|
sgml-exposed-tags:nil
|
|
|
|
sgml-local-catalogs:nil
|
|
|
|
sgml-local-ecat-files:nil
|
|
|
|
End:
|
|
|
|
vim600: syn=xml fen fdm=syntax fdl=2 si
|
|
|
|
vim: et tw=78 syn=sgml
|
|
|
|
vi: ts=1 sw=1
|
|
|
|
-->
|