Ditch attempts at cleaning content

gjtorikian · Dec 9, 2015 · 12a46a2 · 12a46a2
1 parent fa8b673
commit 12a46a2
Show file tree

Hide file tree

Showing 2 changed files with 14 additions and 12 deletions.
diff --git a/lib/html/proofer/checks/html.rb b/lib/html/proofer/checks/html.rb
@@ -39,6 +39,7 @@ def run
 
       # tags embedded in scripts are used in templating languages: http://git.io/vOovv
       next if @validation_opts[:ignore_script_embeds] && message =~ SCRIPT_EMBEDS_MSG
+      next if message =~ /htmlParseEntityRef: expecting ';'/
 
       add_issue(message, line)
     end

diff --git a/lib/html/proofer/utils.rb b/lib/html/proofer/utils.rb
@@ -16,7 +16,7 @@ def create_nokogiri(path)
           content = path
         end
 
-        Nokogiri::HTML(clean_content(content))
+        Nokogiri::HTML(content)
       end
       module_function :create_nokogiri
 
@@ -31,17 +31,18 @@ def swap(href, replacement)
       # address a problem with Nokogiri's parsing URL entities
       # problem from http://git.io/vBYU1
       # solution from http://git.io/vBYUi
-      def clean_content(string)
-        matches = string.scan(%r{https?://([^>]+)}i)
-
-        matches.flatten.each do |url|
-          escaped_url = url.gsub(/&(?!amp;)/, '&amp;')
-          escaped_url = escaped_url.gsub(%r{/}, '&#47;')
-          string.gsub!(url, escaped_url)
-        end
-        string
-      end
-      module_function :clean_content
+      # UPDATE: clean_content is disabled (root cause was never tracked down); checks/html.rb now skips the "htmlParseEntityRef: expecting ';'" message instead.
+      # def clean_content(string)
+      #   matches = string.scan(%r{https?://([^>]+)}i)
+      #
+      #   matches.flatten.each do |url|
+      #     escaped_url = url.gsub(/&(?!amp;)/, '&amp;')
+      #     escaped_url = escaped_url.gsub(%r{/}, '&#47;')
+      #     string.gsub!(url, escaped_url)
+      #   end
+      #   string
+      # end
+      # module_function :clean_content
     end
   end
 end