- Fix HTML entity replacement (related to r2186)

release-0.6
alecpl 16 years ago
parent e1c2e7271e
commit 755900cd6a

@ -176,7 +176,6 @@ class html2text
'/&(bull|#149|#8226);/i', // Bullet
'/&(pound|#163);/i', // Pound sign
'/&(euro|#8364);/i', // Euro sign
'/&[^&;]+;/i', // Unknown/unhandled entities
'/[ ]{2,}/' // Runs of spaces, post-handling
);
@ -220,7 +219,6 @@ class html2text
'*',
'£',
'EUR', // Euro sign. € ?
'', // Unknown/unhandled entities
' ' // Runs of spaces, post-handling
);
@ -475,6 +473,9 @@ class html2text
// Replace known html entities
$text = html_entity_decode($text, ENT_COMPAT, 'UTF-8');
// Remove unknown/unhandled entities. This must run after html_entity_decode() above,
// so it cannot live in the search-and-replace block, which is applied earlier.
$text = preg_replace('/&[^&;]+;/i', '', $text);
// Strip any other HTML tags
$text = strip_tags($text, $this->allowed_tags);

Loading…
Cancel
Save