X-Git-Url: https://git.netwichtig.de/gitweb/?a=blobdiff_plain;f=lib%2Frbot%2Fcore%2Futils%2Fextends.rb;h=7022fb9123ac17b2d3df543e0d0f66002bbea342;hb=bc9e991b8665fdd8f77a257c5381cf70d015a6ec;hp=c43f3f3bf1b55ab292ac92b45a00165336f09eba;hpb=8b45e3f06184a66bd5bfa578c194059a8cf8ceb4;p=user%2Fhenk%2Fcode%2Fruby%2Frbot.git diff --git a/lib/rbot/core/utils/extends.rb b/lib/rbot/core/utils/extends.rb index c43f3f3b..7022fb91 100644 --- a/lib/rbot/core/utils/extends.rb +++ b/lib/rbot/core/utils/extends.rb @@ -51,22 +51,32 @@ class ::String ## Maybe make it configurable? # txt.gsub!(/<\/?a( [^>]*)?>/, "#{Reverse}") - # Paragraph and br tags are converted to whitespace. + # Paragraph and br tags are converted to whitespace txt.gsub!(/<\/?(p|br)\s*\/?\s*>/, ' ') txt.gsub!("\n", ' ') + txt.gsub!("\r", ' ') # All other tags are just removed txt.gsub!(/<[^>]+>/, '') + # Convert HTML entities. We do it now to be able to handle stuff + # such as &nbsp; + txt = Utils.decode_html_entities(txt) + # Remove double formatting options, since they only waste bytes txt.gsub!(/#{Bold}(\s*)#{Bold}/, '\1') txt.gsub!(/#{Underline}(\s*)#{Underline}/, '\1') + # Simplify whitespace that appears on both sides of a formatting option + txt.gsub!(/\s+(#{Bold}|#{Underline})\s+/, ' \1') + txt.sub!(/\s+(#{Bold}|#{Underline})\z/, '\1') + txt.sub!(/\A(#{Bold}|#{Underline})\s+/, '\1') + # And finally whitespace is squeezed txt.gsub!(/\s+/, ' ') # Decode entities and strip whitespace - return Utils.decode_html_entities(txt).strip! + return txt.strip end # This method will strip all HTML crud from the receiver