Module: PragmaticSegmenter::Cleaner::Rules::HTML

Defined in:
lib/pragmatic_segmenter/cleaner/rules.rb

Constant Summary

# Pattern for literal HTML/XML tags (opening, closing and self-closing,
# with or without attributes), paired with an empty replacement string.
#
# Attribute values may be double-quoted, single-quoted or unquoted. The
# unquoted alternative is the negated class [^'">\s]+ (anything that is not a
# quote, `>` or whitespace). It was previously written with an escaped caret,
# which made it a positive class of carets, quotes, `>` and whitespace, so
# tags with unquoted values such as <a href=foo> were never matched.
HTMLTagRule =
Rule.new(/<\/?\w+((\s+\w+(\s*=\s*(?:".*?"|'.*?'|[^'">\s]+))?)+\s*|\s*)\/?>/, '')
# Pattern for entity-escaped tags such as &lt;strong&gt; or &lt;/table&gt;,
# paired with an empty replacement string.
#
# The tag body is any run of characters other than `&`, terminated by the
# full `&gt;` entity. The earlier class [^gt;]* excluded the individual
# letters "g" and "t" (and ";"), so any escaped tag containing either letter
# was silently left in place, and the leading `&` of `&gt;` was not required.
# NOTE(review): escaped tags whose attributes contain other entities
# (e.g. &quot;) are still not matched - confirm whether that is needed.
EscapedHTMLTagRule =
Rule.new(/&lt;\/?[^&]*&gt;/, '')
# The HTML rules in this module, listed with the literal-tag rule first and
# the escaped-tag rule second. Frozen so the shared list cannot be modified
# in place by accident.
All =
[HTMLTagRule, EscapedHTMLTagRule].freeze