package Catmandu::Fix::trim;
use Catmandu::Sane;
our $VERSION = '1.0507';
use Moo;
use Unicode::Normalize;
use namespace::clean;
use Catmandu::Fix::Has;
has path => (fix_arg => 1);
has mode => (fix_arg => 1, default => sub {'whitespace'});
with 'Catmandu::Fix::SimpleGetValue';
sub emit_value {
my ($self, $var) = @_;
my $perl = "if (is_string(${var})) {";
if ($self->mode eq 'whitespace') {
$perl .= "${var} = trim(${var});";
}
elsif ($self->mode eq 'nonword') {
$perl .= $var . ' =~ s/^\W+//;';
$perl .= $var . ' =~ s/\W+$//;';
}
elsif ($self->mode eq 'diacritics') {
$perl .= "${var} = Unicode::Normalize::NFKD(${var});";
$perl .= "${var} =~ s/\\p{NonspacingMark}//g;";
}
$perl .= "}";
$perl;
}
1;
__END__
=pod
=encoding utf-8
=head1 NAME
Catmandu::Fix::trim - trim leading and ending junk from the value of a field
=head1 SYNOPSIS
# the default mode trims whitespace
# e.g. foo => ' abc ';
trim(foo) # foo => 'abc';
trim(foo, whitespace) # foo => 'abc';
# trim non-word characters
# e.g. foo => ' abc / : .';
trim(foo, nonword) # foo => 'abc';
# trim accents
# e.g. foo => 'français' ;
trim(foo,diacritics) # foo => 'francais'
=head1 SEE ALSO
L<Catmandu::Fix>
=cut