diff --git a/src/Readability.php b/src/Readability.php index ebf6844..1ed93ea 100644 --- a/src/Readability.php +++ b/src/Readability.php @@ -157,7 +157,7 @@ class Readability implements LoggerAwareInterface // replace excessive br's '/\s*

']+/>!is' => '', + '!<(?:a|div|p|figure)[^>]+/>!is' => '', // remove all attributes on text tags //'!<(\s*/?\s*(?:blockquote|br|hr|code|div|article|span|footer|aside|p|pre|dl|li|ul|ol)) [^>]+>!is' => "<\\1>", //single newlines cleanup