GOBO::Parsers::Parser - GOBO::Parsers::Parser documentation


GOBO documentation Contained in the GOBO distribution.

Index


Code Index:

NAME

Top

GOBO::Parsers::Parser

SYNOPSIS

Top

  my $p = GOBO::Parser->new;
  $p->parse_file(file => $file, options => $option_h);
  $g = $p->graph;

DESCRIPTION

Top

Base class for all parsers. Parsers take formats (e.g. GOBO::Parsers::OBOParser) and generate objects, typically some combination of GOBO::Node and GOBO::Statement objects

parse_file

$parser->parse_file(file => '/path/to/file', options => $option_h)

input: self file => $f_name # either as /path/to/filename or a FileHandle object options => $opt_h # a hash of options [optional]

The file will be parsed according to the options This method does not return anything; instead, the parser object can be queried for the results.

parse

$parser->parse(options => $option_h)

input: self options => $opt_h # a hash of options [optional]

Parse according to the options. Note that the file to be parsed should already have been specified.

This method does not return anything; instead, the parser object can be queried for the results.

parse_chunk

$parser->parse_chunk(size => 50, options => $option_h)

input: self size => 1000 # the number of lines to parse options => $opt_h # a hash of options [optional]

Parse according to the options. Note that the file to be parsed should already have been specified.

This method does not return anything; instead, the parser object can be queried for the results.

set_file

$parser->set_file($f_name)

input: self $f_name # either as /path/to/filename or a FileHandle object

Set the parser to parse a certain file

set_options

input: self, hash ref of options

Sets a hash of options, accessed by $self->options.

Existing options will remain intact.

set_all_options

input: self, hash ref of options

Sets a hash of options, accessed by $self->options.

Existing options are deleted.

clear_options

input: self, arrayref of strings corresponding to keys in the 'options' hash

Removes key(s) from the options hash

clear_all_options

Delete everything from the options hash

reset_parser

$self->reset_parser

Removes the file handle, data, and options from the parser

reset_temporary_variables

$self->reset_temporary_variables

These variables should be reset every time the parser is used on a new file


GOBO documentation Contained in the GOBO distribution.
package GOBO::Parsers::Parser;
use Moose;
use Moose::Util::TypeConstraints;
#use GOBO::Graph;
use FileHandle;
use Carp;

subtype 'GOBO::Parsers::Parser::ProtoFileHandle' => as class_type('FileHandle');

coerce 'GOBO::Parsers::Parser::ProtoFileHandle'
	=> from 'Str'
		=> via { FileHandle->new( $_ ) }
	=> from 'FileHandle'
		=> via { $_ };

has data => (is=>'rw', isa => 'HashRef', clearer => 'clear_data');

has fh => (is=>'rw', isa=>'GOBO::Parsers::Parser::ProtoFileHandle', clearer=>'clear_fh', predicate=>'has_fh', writer=>'_set_fh', coerce => 1, init_arg => 'file', trigger => \&reset_temporary_variables );
has lines => (is=>'rw', isa=>'ArrayRef',default=>sub{[]});
has line_no => (is=>'rw', isa=>'Int', default=>sub{0});
has parsed_header => (is=>'rw', isa=>'Bool');
has stalled => (is=>'rw', isa=>'Bool');

has max_chunk => (is=>'rw', isa=>'Int', init_arg => 'size', clearer=>'clear_max_chunk');

has options => (is => 'rw', isa => 'HashRef', clearer => 'clear_all_options', trigger => \&reset_checked_options );
has checked_options => (is => 'rw', isa => 'Bool');
has header_parser_options => (is => 'rw', isa => 'HashRef', clearer => 'clear_header_parser_options', predicate => 'has_header_parser_options', writer => 'set_header_parser_options');
has body_parser_options => (is => 'rw', isa => 'HashRef', clearer => 'clear_body_parser_options', predicate => 'has_body_parser_options', writer => 'set_body_parser_options');

has liberal_mode => (is=>'rw', isa=>'Bool',default=>sub{1});

sub BUILDARGS {
	my $class = shift;
	return $class->SUPER::BUILDARGS(@_) unless ( @_ );
	my %arg_h = ( @_ );

	if ( $arg_h{fh} ) {
		$arg_h{file} = $arg_h{fh};
		delete $arg_h{fh};
	}
	return \%arg_h;
}


sub parse_file {
	my $self = shift;
	my %args;
	# allow parse_file('/path/to/file')
	if (scalar @_ == 1)
	{	$args{file} = shift;
	}
	else
	{	%args = (@_);
	}
	
	# initialize the fh
	$self->set_fh($args{file});
	$self->set_options($args{options}) if $args{options};
	
	# parse the file
	$self->_parse;

	return 1;
}


sub parse {
	my $self = shift;
	confess "No file handle present!" unless $self->has_fh;

	my %args = (@_);
	$self->set_options($args{options}) if $args{options};

	return $self->_parse;
}


sub parse_chunk {
	my $self = shift;
	if ($self->parsed_header && ! $self->stalled) {
		return 0;
	}
	confess "No file handle present!" unless $self->has_fh;
	my %args = (@_);
	$self->max_chunk($args{size}) if $args{size};
	$self->set_options($args{options}) if $args{options};
	return $self->_parse;
}



sub _parse {
	my $self = shift;
	return 0 unless $self->has_fh;
	
	# make sure we've checked our parser options
	$self->check_options;
	if ($self->parsed_header)
	{	
            #print STDERR "Header has been parsed!\n";
            #print STDERR "parser: " . $self->dump(2) . "\n";
	}
	else
	{	$self->parse_header;
	}
	$self->parse_body;

	# close the file handle
#	$self->fh->close if ! $self->stalled;
	return 1;
}



sub create {
	my $proto = shift;
	my %argh = @_;
	my $fmt = $argh{format};
	if ($fmt) {
		my $pc;
		if ($fmt eq 'obo') {
			$pc = 'GOBO::Parsers::OBOParser';
		}
		#require $pc;
		return $pc->new(%argh);
	}
}


sub set_file {
	my $self = shift;
	my $f = shift || die "No file specified! Dying";

	# clear the existing fh
	$self->clear_fh;

	# if there is an argument passed
	# is it a filehandle?
	if (ref $f && ref $f eq 'FileHandle')
	{	$self->_set_fh($f);
		return;
	}
	elsif (! ref $f)
	{	my $fh;
		if ($f =~ /\.gz$/) {
                    $fh = FileHandle->new("gzip -dc $f |") or confess "Could not create a filehandle for $f: $! ";
		}
		else {
			$fh = FileHandle->new($f, "r") or confess "Could not create a filehandle for $f: $! ";
		}
		$self->_set_fh($fh);
		return;
	}
	# uh-oh, no FH in sight! :o
	confess "Could not find create a filehandle!";
}
*set_fh = \&set_file;


sub next_line {
	my $self = shift;
	my $fh = $self->fh;
	my $max_chunk = $self->max_chunk;
	my $line_no = $self->line_no + 1;
	$self->line_no($line_no);
	
	$self->stalled(0);
	if ($self->parsed_header && $max_chunk && $line_no > $max_chunk) {
		$self->line_no(0);
		$self->stalled(1);
		return undef;
	}
	my $lines = $self->lines;
	if (@$lines) {
		return shift @$lines;
	}
	
	my $line = <$fh>;
	return $line;
}


sub unshift_line {
	my $self = shift;
	$self->line_no($self->line_no - scalar(@_));
	unshift(@{$self->lines},@_);
	return;
}


sub set_options {
	my $self = shift;
	my $o = shift;
	my $options = $self->options;

	while ( my ( $k, $v ) = each %$o )
	{	$options->{$k} = $v;
	}
	
	if (! $options || ! keys %$options )
	{	$self->clear_all_options;
		return;
	}
	$self->options($options);
}

*set_option = \&set_options;


sub set_all_options {
	my $self = shift;
	my $o = shift;

	$self->clear_all_options;

	if (! $o || ! keys %$o )
	{	return;
	}

	$self->options($o);

}



sub clear_options {
	my $self = shift;
	my $o = shift;
	my $options = $self->options || {};

	# convert scalar to an array ref
	$o = [ $o ] if ! ref $o;

	foreach (@$o)
	{	delete $options->{$_};
	}

	if (! $options || ! keys %$options )
	{	$self->clear_all_options;
		return;
	}

	$self->options($options);

}

*clear_option = \&clear_options;


sub check_options {
	my $self = shift;
	$self->checked_options(1);
}

sub reset_checked_options {
	shift->checked_options(0);
}

sub reset_parser {
	my $self = shift;
	$self->clear_fh;
	$self->clear_all_options;
	$self->clear_data;
	$self->clear_max_chunk;
	$self->reset_temporary_variables;
}


sub reset_temporary_variables {
	my $self = shift;
	$self->parsed_header(0);
	$self->stalled(0);
	$self->line_no(0);
	$self->checked_options(0);
}


1;