# # Copyright (C) 1998 Ken MacLeod # XML::SAX2Perl is free software; you can redistribute it and/or # modify it under the same terms as Perl itself. # # $Id: SAX2Perl.pm,v 1.3 1999/12/22 21:15:00 kmacleod Exp $ # use strict; package XML::SAX2Perl; use vars qw{ $VERSION }; # will be substituted by make-rel script $VERSION = "0.07"; sub new { my $type = shift; my $self = ($#_ == 0) ? shift : { @_ }; return bless $self, $type; } sub setDocumentLocator { my $self = shift; my $self->{Locator} = shift; } sub startDocument { my $self = shift; my @properties; if (defined $self->{Locator}) { push @properties, locator => $self->{Locator}; } $self->{DocumentHandler}->start_document(@properties); } sub endDocument { my $self = shift; $self->{DocumentHandler}->end_document; } sub startElement { my $self = shift; my $name = shift; my $atts = shift; # FIXME depends on how Perl SAX treats attributes $self->{DocumentHandler}->start_element(Name => $name, Attributes => $attributes); } sub endElement { my $self = shift; my $name = shift; $self->{DocumentHandler}->end_element(Name => $name); } sub characters { my $self = shift; my $ch = shift; my $start = shift; my $length = shift; $self->{DocumentHandler}->characters(Data => substr($ch, $start, $length)); } sub ignorableWhitespace { my $self = shift; my $ch = shift; my $start = shift; my $length = shift; $self->{DocumentHandler}->ignorable_whitespace(Data => substr($ch, $start, $length)); } sub processingInstruction { my $self = shift; my $target = shift; my $data = shift; $self->{DocumentHandler}->processing_instruction(Target => $target, Data => $data); } 1; __END__ =head1 NAME XML::SAX2Perl -- translate Java/CORBA style SAX methods to Perl methods =head1 SYNOPSIS use XML::SAX2Perl; $sax2perl = XML::SAX2Perl(Handler => $my_handler); $sax->setDocumentHandler($sax2perl); =head1 DESCRIPTION C is a SAX filter that translates Java/CORBA style SAX methods to Perl style method calls. This man page summarizes the specific options, handlers, and properties supported by C; please refer to the Perl SAX standard C for general usage information. =head1 METHODS =over 4 =item new Creates a new parser object. Default options for parsing, described below, are passed as key-value pairs or as a single hash. Options may be changed directly in the parser object unless stated otherwise. Options passed to `C' override the default options in the parser object for the duration of the parse. =item parse Parses a document. Options, described below, are passed as key-value pairs or as a single hash. Options passed to `C' override default options in the parser object. =item location Returns the location as a hash: ColumnNumber The column number of the parse. LineNumber The line number of the parse. PublicId A string containing the public identifier, or undef if none is available. SystemId A string containing the system identifier, or undef if none is available. =item SAX DocumentHandler Methods The following methods are DocumentHandler methods that the SAX 1.0 parser will call and C will translate to Perl SAX methods calls. See SAX 1.0 for details. setDocumentLocator(locator) startDocument() endDocument() startElement(name, atts) endElement(name) characters(ch, start, length) ignorableWhitespace(ch, start, length) processingInstruction(target, data) =back =head1 OPTIONS The following options are supported by C: Handler default handler to receive events DocumentHandler handler to receive document events DTDHandler handler to receive DTD events ErrorHandler handler to receive error events EntityResolver handler to resolve entities Locale locale to provide localisation for errors Source hash containing the input source for parsing If no handlers are provided then all events will be silently ignored, except for `C' which will cause a `C' to be called after calling `C'. If a single string argument is passed to the `C' method, it is treated as if a `C' option was given with a `C' parameter. The `C' hash may contain the following parameters: ByteStream The raw byte stream (file handle) containing the document. String A string containing the document. SystemId The system identifier (URI) of the document. PublicId The public identifier. Encoding A string describing the character encoding. If more than one of `C', `C', or `C', then preference is given first to `C', then `C', then `C'. =head1 HANDLERS The following handlers and properties are supported by C: =head2 DocumentHandler methods =over 4 =item start_document Receive notification of the beginning of a document. Locator An object that can return the location of any SAX document event. =item end_document Receive notification of the end of a document. No properties defined. =item start_element Receive notification of the beginning of an element. Name The element type name. Attributes Attributes attached to the element, if any. ALPHA WARNING: The `C' value is not translated from the SAX 1.0 value, so it will contain an AttributeList object. =item end_element Receive notification of the end of an element. Name The element type name. =item characters Receive notification of character data. Data The characters from the XML document. =item ignorable_whitespace Receive notification of ignorable whitespace in element content. Data The characters from the XML document. =item processing_instruction Receive notification of a processing instruction. Target The processing instruction target. Data The processing instruction data, if any. =back =head1 AUTHOR Ken MacLeod =head1 SEE ALSO perl(1), XML::Perl2SAX(3). Extensible Markup Language (XML) Simple API for XML (SAX) =cut