package RDF::Trine::Parser::ShorthandRDF;

use utf8;
use 5.010;
use strict;
use warnings;
no warnings 'redefine';
no warnings 'once';
use base qw(RDF::Trine::Parser::Notation3);
use RDF::Trine qw(literal);
use RDF::Trine::Statement;
use RDF::Trine::Namespace;
use RDF::Trine::Node;
use RDF::Trine::Error;
use Scalar::Util qw(blessed looks_like_number);

our ($VERSION, $AUTHORITY);

BEGIN 
{
	$VERSION   = '0.204';
	$AUTHORITY = 'cpan:TOBYINK';
	
	my $class = __PACKAGE__;
	$RDF::Trine::Parser::encodings{$class } = 'utf8';
	$RDF::Trine::Parser::canonical_media_types{ $class } = 'text/x.shorthand-rdf';
	
	$RDF::Trine::Parser::parser_names{$_} = __PACKAGE__
		foreach ('shorthand', 'shorthandrdf');
	
	$RDF::Trine::Parser::media_types{$_} = __PACKAGE__
		foreach qw(text/x.shorthand-rdf text/x-shorthand-rdf);
	
	$RDF::Trine::Parser::file_extensions{$_} = __PACKAGE__
		foreach qw(n3x);

	$RDF::Trine::Parser::format_uris{$_} = __PACKAGE__
		foreach ('http://buzzword.org.uk/2010/n3x');
}

# Force the default prefix to be bound to the base URI.
sub _Document {
	my $self	= shift;
	my $uri  = $self->{'baseURI'};
	$self->{bindings}     = {};
	$self->{bindings}{''} = ($uri =~ /#$/ ? $uri : "${uri}#");
	$self->{keywords}     = undef;
	$self->{shorthands}   = [];
	$self->{pragmata}     = {};
	$self->_apply_profile($self->{baseURI}, $self->{profile}, 0)
		if defined $self->{profile} && length $self->{profile};
	$self->SUPER::_Document(@_);
}

sub _triple {
	my ($self, $s, $p, $o) = @_;
	
	if (defined $self->{pragmata}{rdf}
	and $self->{pragmata}{rdf}->is_literal
	and lc $self->{pragmata}{rdf}->literal_value eq 'true')
	{
		my $st = RDF::Trine::Statement->new($s, $p, $o);
		throw RDF::Trine::Error::ParserError -text => ("Non-RDF triple in RDF-only mode: ".$st->sse)
			unless $st->rdf_compatible && !$o->isa('RDF::Trine::Node::Formula');
	}

	if (defined $self->{pragmata}{'blank-nodes'}
	and $self->{pragmata}{'blank-nodes'}->is_literal
	and lc $self->{pragmata}{'blank-nodes'}->literal_value eq 'false')
	{
		my $st = RDF::Trine::Statement->new($s, $p, $o);
		throw RDF::Trine::Error::ParserError -text => ("Blank node found: ".$st->sse)
			if grep { $_->is_blank } ($s, $p, $o);
	}

	if (defined $self->{pragmata}{trig}
	and $self->{pragmata}{trig}->is_literal
	and lc $self->{pragmata}{trig}->literal_value eq 'true'
	and $s->is_resource
	and $p->is_resource
	and $p->uri eq 'http://www.w3.org/2002/07/owl#sameAs'
	and $o->isa('RDF::Trine::Node::Formula')
	and (my $code = $self->{handle_triple}))
	{
		foreach my $st ($o->pattern->triples)
		{
			my ($S, $P, $O) = $st->nodes;
			
			if ($self->{canonicalize}
			and $O->isa('RDF::Trine::Node::Literal')
			and $O->has_datatype)
			{
				my $canon = RDF::Trine::Node::Literal->canonicalize_literal_value(
					$O->literal_value, $O->literal_datatype, 1);
				$O = RDF::Trine::Node::Literal->new($canon, undef, $O->literal_datatype);
			}
			
			my $quad = RDF::Trine::Statement::Quad->new($S, $P, $O, $s);
			$code->($quad);
		}
		
		return;
	}
	
	$self->SUPER::_triple($s, $p, $o);
}

sub __consume_ws {
	my $self	= shift;
	BIT: while ($self->{tokens} =~ m/^[\t\r\n #]/)
	{
		if ($self->{tokens} =~ m/^[#]/)
		{
			foreach my $shorthand ( reverse @{ $self->{shorthands} } )
			{
				my ($type, $pattern, $full, $basethen) = @$shorthand;
				last BIT if ($type eq '@pattern' and $self->{tokens} =~ $pattern);
			}
		}
		
		$self->_ws();
	}
}


sub _directive_test {
	my $self	= shift;
	if ($self->{tokens} =~ m/^\@(base|prefix|forSome|forAll|keywords|namepattern|dtpattern|pattern|term|profile|import|pragma)\b/io) {
		return 1;
	} else {
		return 0;
	}
}

# Shorthand-specific directives
sub _directive {
	my $self	= shift;
	if ($self->_at_pragma_test()) {
		$self->_at_pragma();
	} elsif ($self->_at_namepattern_test()) {
		$self->_at_namepattern();
	} elsif ($self->_at_dtpattern_test()) {
		$self->_at_dtpattern();
	} elsif ($self->_at_term_test()) {
		$self->_at_term();
	} elsif ($self->_at_pattern_test()) {
		$self->_at_pattern();
	} elsif ($self->_at_profile_test()) {
		$self->_at_profile();
	} else {
		$self->SUPER::_directive(@_);
	}
}

sub _at_namepattern_test {
	my $self = shift;
	return $self->__startswith('@namepattern');
}

sub _at_dtpattern_test {
	my $self = shift;
	return $self->__startswith('@dtpattern');
}

sub _at_term_test {
	my $self = shift;
	return $self->__startswith('@term');
}

sub _at_pragma_test {
	my $self = shift;
	return $self->__startswith('@pragma');
}

sub _at_pattern_test {
	my $self = shift;
	return $self->__startswith('@pattern');
}

sub _at_profile_test {
	my $self = shift;
	return $self->__startswith('@profile') || $self->__startswith('@import');
}

sub _at_namepattern {
	my $self	= shift;
	
	$self->_eat('@namepattern');
	$self->_ws();
	$self->__consume_ws();
	
	my $pattern = $self->_literal()->literal_value;
	$self->__consume_ws();
	
	my $uri = $self->_uriref();
	$self->__consume_ws();

	push @{ $self->{shorthands} }, ['@pattern', qr/^($pattern)/, RDF::Trine::Node::Resource->new($uri.'$0'), $self->{baseURI}];
	return $self->{shorthands}[-1];
}

sub _at_pattern {
	my $self	= shift;
	
	$self->_eat('@pattern');
	$self->_ws();
	$self->__consume_ws();
	
	my $pattern = $self->_literal()->literal_value;
	$self->__consume_ws();
	
	my $thing;
	local($self->{suspend_callback}) = 1;
	if ($self->_resource_test)
		{ $thing = $self->_resource(); }
	else
		{ $thing = $self->_literal(); }
	$self->__consume_ws();

	push @{ $self->{shorthands} }, ['@pattern', qr/^($pattern)/, $thing, $self->{baseURI}];
	return $self->{shorthands}[-1];
}

sub _at_dtpattern {
	my $self	= shift;
	
	$self->_eat('@dtpattern');
	$self->_ws();
	$self->__consume_ws();
	
	my $pattern = $self->_literal()->literal_value;
	$self->__consume_ws();
	
	my $uri = $self->_uriref();
	$self->__consume_ws();

	push @{ $self->{shorthands} }, ['@pattern', qr/^($pattern)/, RDF::Trine::Node::Literal->new('$0', undef, $uri), $self->{baseURI}];
	return $self->{shorthands}[-1];
}

sub _at_term {
	my $self	= shift;
	
	$self->_eat('@term');
	$self->_ws();
	$self->__consume_ws();
	
	my $token;
	
	if ( $self->{'tokens'} =~ m/^([A-Za-z_][A-Za-z0-9_-]*)\s/o )
	{
		$token = $1;
		$self->_eat($token);
	}
	else
	{
		$self->_eat('token_name'); # and die!
	}
	$self->__consume_ws();

	local($self->{suspend_callback}) = 1;
	my $thing = $self->_any_node();
	$self->__consume_ws();

	push @{ $self->{shorthands} }, ['@term', $token, $thing];
	return $self->{shorthands}[-1];
}

sub _at_pragma {
	my $self	= shift;
	
	$self->_eat('@pragma');
	$self->_ws();
	$self->__consume_ws();
	
	my $token;
	
	if ( $self->{'tokens'} =~ m/^([A-Za-z_][A-Za-z0-9_-]*)\s/o )
	{
		$token = $1;
		$self->_eat($token);
	}
	else
	{
		$self->_eat('token_name'); # and die!
	}
	$self->__consume_ws();

	local($self->{suspend_callback}) = 1;
	my $value = $self->_any_node();
	$self->__consume_ws();

	return $self->{pragmata}{$token} = $value;
}

sub _at_profile {
	my $self	= shift;
	
	my $import = 0;
	if ($self->__startswith('@profile'))
		{ $self->_eat('@profile'); }
	else
		{ $self->_eat('@import'); $import++; }
	
	$self->_ws();
	$self->__consume_ws();
	
	my $url = $self->_uriref();
	$self->__consume_ws();
	
	$url = $self->__URI($url, $self->{baseURI})->uri;
	
	$self->{handle_triple}->(RDF::Trine::Statement->new(
		$self->__URI('', $self->{baseURI}),
		RDF::Trine::Node::Resource->new('http://www.w3.org/2002/07/owl#imports'),
		RDF::Trine::Node::Resource->new($url),		
		)) if $import;

	my $ua = LWP::UserAgent->new(agent => "RDF::TriN3/$RDF::TriN3::VERSION");
	$ua->default_headers->push_header(Accept => 'text/x.shorthand-rdf, text/x-shorthand-rdf, text/n3, text/turtle');
	my $resp = $ua->get($url);
	unless ($resp->is_success) {
		throw RDF::Trine::Error::ParserError -text => $resp->status_line;
	}

	return $self->_apply_profile($resp->base, $resp->decoded_content, $import);
}

sub _apply_profile
{
	my ($self, $base, $data, $import) = @_;
	
	my $class = ref $self;
	my $child = $class->new(profile => '');
	$child->parse($base, $data, sub {
		$self->{handle_triple}->($_[0]) if $import;
	});
		
	my %child_bindings = %{ $child->{bindings} || {} };
	while (my ($prefix, $full) = each %child_bindings)
	{
		$self->{bindings}{$prefix} = $full
			if length $prefix;
	}
	
	push @{ $self->{shorthands} }, @{ $child->{shorthands} || [] };
	return $self->{shorthands}[-1];
}

sub _resource_test {
	my $self	= shift;
	return 0 unless (length($self->{tokens}));
	
	my $rv = $self->SUPER::_resource_test(@_);
	return $rv if $rv;
	
	foreach my $shorthand ( reverse @{ $self->{shorthands} } )
	{
		my ($type, $pattern, $full, $basethen) = @$shorthand;
		
		if ($type eq '@pattern' and $self->{'tokens'} =~ $pattern)
			{ return 1; }
		elsif ($type eq '@term' and $self->__startswith($pattern))
			{ return 1; }
	}	

	return 0;
}

sub _resource {
	my $self	= shift;

	foreach my $shorthand ( reverse @{ $self->{shorthands} } )
	{
		my ($type, $pattern, $full, $basethen) = @$shorthand;
		
		if ($type eq '@pattern' and $self->{'tokens'} =~ $pattern)
		{
			my $token = $1;
			$self->_eat($token);
			
			if ($full->is_literal && $full->has_datatype)
			{
				my $replaced_uri = $self->_PATTERN_($token, $pattern, $full->literal_datatype);
				my $absolute_uri = $self->__URI($replaced_uri, $basethen);
				return $self->__Literal(
					$self->_PATTERN_($token, $pattern, $full->literal_value),
					undef,
					$absolute_uri,
					);
			}
			elsif ($full->is_literal)
			{
				return $self->__Literal(
					$self->_PATTERN_($token, $pattern, $full->literal_value),
					($full->has_language ? $self->_PATTERN_($token, $pattern, $full->literal_value_language) : undef),
					);
			}
			elsif ($full->is_resource)
			{
				my $replaced_uri = $self->_PATTERN_($token, $pattern, $full->uri);
				return $self->__URI($replaced_uri, $basethen);
			}
		}
		elsif ($type eq '@term' and $self->__startswith($pattern))
		{
			$self->_eat($pattern);
			return $full;
		}
	}	

	return $self->SUPER::_resource(@_);
}

sub _PATTERN_
{
	my ($self, $thingy, $pattern, $template) = @_;

	return unless defined $template;
	$template = "$template";
	return $template unless $template =~ /\$/;

	my %vals = (0 => $thingy);
	my @matches = ($thingy =~ /$pattern/);
	for (my $i=0; $i <= $#matches; $i++)
	{
		$vals{$i + 1} = $matches[$i];
	}
	foreach my $bufname (keys %-)
	{
		$vals{$bufname} = $-{$bufname}->[0];
	}
	
	my $orig_template = $template;
	
	my $rv = '';
	my $count = 0;
	while (length $template)
	{
		$count++;
		die if $count > 300;
		
		if ((substr $template, 0, 1) eq '$')
		{
			$template = substr $template, 1;
			
			my $buffer;
			if ($template =~ /^ \{ ([^\}]+) \} (.*) $/xo)
			{
				($buffer, $template) = ($1, $2);
			}
			elsif ($template =~ /^(\d+)/o)
			{
				$buffer = $1;
				$template = substr($template, length $buffer);
			}
			elsif ($template =~ /^([_A-Za-z][_A-Za-z0-9]*)/o)
			{
				$buffer = $1;
				$template = substr($template, length $buffer);
			}
			else
			{
				throw RDF::Trine::Error::ParserError -text => "Unexpected pattern in replace: ${orig_template}\n";
			}
			$rv .= $vals{$buffer};
		}
		else
		{
			my ($start, $rest) = split /\$/, $template, 2;
			$rv .= $start;
			$template = '$'.(defined $rest ? $rest : '');
		}
	}

	return $rv;
}

1;

__END__

=head1 NAME

RDF::Trine::Parser::ShorthandRDF - Shorthand RDF Parser

=head1 SYNOPSIS

 use RDF::Trine::Parser;
 my $parser     = RDF::Trine::Parser->new( 'ShorthandRDF' );
 $parser->parse_into_model( $base_uri, $data, $model );

=head1 DESCRIPTION

ShorthandRDF is an extension of N3 syntax. It's currently defined at
L<http://esw.w3.org/ShorthandRDF>.

=head2 Methods

This package exposes the same methods as RDF::Trine::Parser::Notation3.

=head1 BUGS

Please report any bugs to
L<http://rt.cpan.org/Dist/Display.html?Queue=RDF-TriN3>.

=head1 SEE ALSO

L<RDF::TriN3>,
L<RDF::Trine::Parser::Pretdsl>,
L<RDF::Trine::Parser::Notation3>.

L<http://esw.w3.org/ShorthandRDF>.

=head1 AUTHOR

Toby Inkster  C<< <tobyink@cpan.org> >>

Based on RDF::Trine::Parser::Turtle by Gregory Todd Williams. 

=head1 COPYRIGHT AND LICENCE

Copyright (c) 2006-2010 Gregory Todd Williams. 

Copyright (c) 2010-2012 Toby Inkster.

This library is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.

=head1 DISCLAIMER OF WARRANTIES

THIS PACKAGE IS PROVIDED "AS IS" AND WITHOUT ANY EXPRESS OR IMPLIED
WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF
MERCHANTIBILITY AND FITNESS FOR A PARTICULAR PURPOSE.

=cut