class Nokogiri::HTML::SAX::Parser
For more information on SAX parsers, see Nokogiri::XML::SAX.
parser.parse(File.read(ARGV[0], mode: 'rb'))
parser = Nokogiri::HTML::SAX::Parser.new(MyDoc.new)
end
end
puts "found a #{name}"
def start_element name, attributes = []
class MyDoc < Nokogiri::XML::SAX::Document
Here is a basic usage example:
error correction.
This class lets you perform SAX style parsing on HTML with HTML
##
def parse_file filename, encoding = 'UTF-8'
##
# Parse the HTML file at +filename+, sending SAX events through this parser.
#
# filename:: path of the file to parse; must be non-nil
# encoding:: encoding name passed to ParserContext.file (default 'UTF-8')
#
# When a block is given, the newly created ParserContext is yielded to it
# before parsing begins.
#
# Raises ArgumentError if +filename+ is nil or false, Errno::ENOENT if the
# path does not exist, and Errno::EISDIR if the path is a directory.
#
# Returns the result of ParserContext#parse_with.
def parse_file(filename, encoding = 'UTF-8')
  raise ArgumentError, 'filename is required' unless filename
  # File.exist? is used because File.exists? was removed in Ruby 3.2.
  raise Errno::ENOENT, filename.to_s unless File.exist?(filename)
  raise Errno::EISDIR, filename.to_s if File.directory?(filename)

  ctx = ParserContext.file(filename, encoding)
  yield ctx if block_given?
  ctx.parse_with(self)
end
def parse_memory data, encoding = 'UTF-8'
##
# Parse HTML held in memory, sending SAX events through this parser.
#
# data::     the document content; must be non-nil
# encoding:: encoding name passed to ParserContext.memory (default 'UTF-8')
#
# When a block is given, the newly created ParserContext is yielded to it
# before parsing begins.
#
# Raises ArgumentError if +data+ is nil or false.
#
# Returns nil without creating a context when +data+ is empty; otherwise
# returns the result of ParserContext#parse_with.
def parse_memory(data, encoding = 'UTF-8')
  raise ArgumentError, 'data is required' unless data
  return if data.empty?

  ctx = ParserContext.memory(data, encoding)
  yield ctx if block_given?
  ctx.parse_with(self)
end