From 755900cd6aef3e9808dfd76c797904a2c8b08bed Mon Sep 17 00:00:00 2001
From: alecpl <alec@alec.pl>
Date: Wed, 21 Jan 2009 02:55:09 -0500
Subject: [PATCH] - Fix html entities replacement (related to r2186)

---
 program/lib/html2text.php |    5 +++--
 1 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/program/lib/html2text.php b/program/lib/html2text.php
index e2a5b24..b00c28a 100644
--- a/program/lib/html2text.php
+++ b/program/lib/html2text.php
@@ -176,7 +176,6 @@
         '/&(bull|#149|#8226);/i',                // Bullet
         '/&(pound|#163);/i',                     // Pound sign
         '/&(euro|#8364);/i',                     // Euro sign
-        '/&[^&;]+;/i',                           // Unknown/unhandled entities
         '/[ ]{2,}/'                              // Runs of spaces, post-handling
     );
 
@@ -220,7 +219,6 @@
         '*',
         '£',
         'EUR',                                  // Euro sign. � ?
-        '',                                     // Unknown/unhandled entities
         ' '                                     // Runs of spaces, post-handling
     );
 
@@ -475,6 +473,9 @@
 	// Replace known html entities
 	$text = html_entity_decode($text, ENT_COMPAT, 'UTF-8');
 
+        // Remove unknown/unhandled entities (must run after html_entity_decode() above, so it cannot be done in the search-and-replace block)
+        $text = preg_replace('/&[^&;]+;/i', '', $text); 
+
         // Strip any other HTML tags
         $text = strip_tags($text, $this->allowed_tags);
 

--
Gitblit v1.9.1