The Perl Toolchain Summit needs more sponsors. If your company depends on Perl, please support this very important event.
package Catmandu::Fix::trim;

use Catmandu::Sane;

our $VERSION = '1.0603';

use Moo;
use Unicode::Normalize;
use namespace::clean;
use Catmandu::Fix::Has;

has path => (fix_arg => 1);
has mode => (fix_arg => 1, default => sub {'whitespace'});

with 'Catmandu::Fix::SimpleGetValue';

sub emit_value {
    my ($self, $var) = @_;

    my $perl = "if (is_string(${var})) {";
    if ($self->mode eq 'whitespace') {
        $perl .= "${var} = trim(${var});";
    }
    elsif ($self->mode eq 'nonword') {
        $perl .= $var . ' =~ s/^\W+//;';
        $perl .= $var . ' =~ s/\W+$//;';
    }
    elsif ($self->mode eq 'diacritics') {
        $perl .= "${var} = Unicode::Normalize::NFKD(${var});";
        $perl .= "${var} =~ s/\\p{NonspacingMark}//g;";
    }
    $perl .= "}";
    $perl;
}

1;

__END__

=pod

=encoding utf-8

=head1 NAME

Catmandu::Fix::trim - trim leading and ending junk from the value of a field

=head1 SYNOPSIS

   # the default mode trims whitespace
   # e.g. foo => '   abc   ';

   trim(foo) # foo => 'abc';
   trim(foo, whitespace) # foo => 'abc';
   
   # trim non-word characters
   # e.g. foo => '   abc  / : .';
   trim(foo, nonword) # foo => 'abc';

   # trim accents
   # e.g. foo => 'français' ;
   trim(foo,diacritics) # foo => 'francais'
   
=head1 SEE ALSO

L<Catmandu::Fix>

=cut