require 'xsd/xmlparser'
require 'xmlscan/scanner'
module XSD
module XMLParser
class XMLScanner < XSD::XMLParser::Parser
include XMLScan::Visitor
def do_parse(string_or_readable)
@attrs = {}
@curattr = nil
@scanner = XMLScan::XMLScanner.new(self)
@scanner.kcode = XSD::Charset.charset_str(charset) if charset
@scanner.parse(string_or_readable)
end
def scanner_kcode=(charset)
@scanner.kcode = XSD::Charset.charset_str(charset) if charset
self.xmldecl_encoding = charset
end
ENTITY_REF_MAP = {
'lt' => '<',
'gt' => '>',
'amp' => '&',
'quot' => '"',
'apos' => '\''
}
def parse_error(msg)
raise ParseError.new(msg)
end
def wellformed_error(msg)
raise NotWellFormedError.new(msg)
end
def valid_error(msg)
raise NotValidError.new(msg)
end
def warning(msg)
p msg if $DEBUG
end
def on_xmldecl_version(str)
end
def on_xmldecl_encoding(str)
self.scanner_kcode = str
end
def on_chardata(str)
characters(str)
end
def on_etag(name)
end_element(name)
end
def on_entityref(ref)
characters(ENTITY_REF_MAP[ref])
end
def on_charref(code)
characters([code].pack('U'))
end
def on_charref_hex(code)
on_charref(code)
end
def on_stag(name)
@attrs = {}
end
def on_attribute(name)
@attrs[name] = @curattr = ''
end
def on_attr_value(str)
@curattr << str
end
def on_attr_entityref(ref)
@curattr << ENTITY_REF_MAP[ref]
end
def on_attr_charref(code)
@curattr << [code].pack('U')
end
def on_attr_charref_hex(code)
on_attr_charref(code)
end
def on_stag_end_empty(name)
on_stag_end(name)
on_etag(name)
end
def on_stag_end(name)
start_element(name, @attrs)
end
add_factory(self)
end
end
end